From fb9bdbb294428e20981dd99af44fc038e8fb9e09 Mon Sep 17 00:00:00 2001 From: Waldemar Brodkorb Date: Tue, 25 Aug 2015 11:40:44 +0200 Subject: update 4.1.x to latest --- .../solidrun-imx6/patches/4.1.3/0001-xbian.patch | 171697 ------------------ .../solidrun-imx6/patches/4.1.6/0001-xbian.patch | 171697 ++++++++++++++++++ 2 files changed, 171697 insertions(+), 171697 deletions(-) delete mode 100644 target/arm/solidrun-imx6/patches/4.1.3/0001-xbian.patch create mode 100644 target/arm/solidrun-imx6/patches/4.1.6/0001-xbian.patch (limited to 'target/arm/solidrun-imx6/patches') diff --git a/target/arm/solidrun-imx6/patches/4.1.3/0001-xbian.patch b/target/arm/solidrun-imx6/patches/4.1.3/0001-xbian.patch deleted file mode 100644 index 6286c0868..000000000 --- a/target/arm/solidrun-imx6/patches/4.1.3/0001-xbian.patch +++ /dev/null @@ -1,171697 +0,0 @@ -diff -Nur linux-4.1.3/arch/arm/boot/dts/imx6dl.dtsi linux-xbian-imx6/arch/arm/boot/dts/imx6dl.dtsi ---- linux-4.1.3/arch/arm/boot/dts/imx6dl.dtsi 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/arch/arm/boot/dts/imx6dl.dtsi 2015-07-27 23:13:00.299912248 +0200 -@@ -60,17 +60,103 @@ - }; - - soc { -- ocram: sram@00900000 { -+ busfreq { /* BUSFREQ */ -+ compatible = "fsl,imx6_busfreq"; -+ clocks = <&clks 171>, <&clks 6>, <&clks 11>, <&clks 104>, <&clks 172>, <&clks 58>, -+ <&clks 18>, <&clks 60>, <&clks 20>, <&clks 3>, <&clks 22> , <&clks 8>; -+ clock-names = "pll2_bus", "pll2_pfd2_396m", "pll2_198m", "arm", "pll3_usb_otg", "periph", -+ "periph_pre", "periph_clk2", "periph_clk2_sel", "osc", "axi_sel", "pll3_pfd1_540m"; -+ interrupts = <0 107 0x04>, <0 112 0x4>; -+ interrupt-names = "irq_busfreq_0", "irq_busfreq_1"; -+ fsl,max_ddr_freq = <400000000>; -+ }; -+ -+ gpu@00130000 { -+ compatible = "fsl,imx6dl-gpu", "fsl,imx6q-gpu"; -+ reg = <0x00130000 0x4000>, <0x00134000 0x4000>, -+ <0x0 0x0>; -+ reg-names = "iobase_3d", "iobase_2d", -+ "phys_baseaddr"; -+ interrupts = <0 9 0x04>, <0 10 0x04>; -+ interrupt-names = "irq_3d", "irq_2d"; -+ clocks = <&clks 26>, <&clks 27>, -+ <&clks 121>, <&clks 122>, -+ <&clks 74>; -+ clock-names = "gpu2d_axi_clk", "gpu3d_axi_clk", -+ "gpu2d_clk", "gpu3d_clk", -+ "gpu3d_shader_clk"; -+ resets = <&src 0>, <&src 3>; -+ reset-names = "gpu3d", "gpu2d"; -+ power-domains = <&gpc 1>; -+ }; -+ -+ hdmi_core: hdmi_core@00120000 { -+ compatible = "fsl,imx6q-hdmi-core"; -+ reg = <0x00120000 0x9000>; -+ clocks = <&clks 124>, <&clks 123>; -+ clock-names = "hdmi_isfr", "hdmi_iahb"; -+ status = "disabled"; -+ }; -+ -+ hdmi_video: hdmi_video@020e0000 { -+ compatible = "fsl,imx6q-hdmi-video"; -+ reg = <0x020e0000 0x1000>; -+ reg-names = "hdmi_gpr"; -+ interrupts = <0 115 0x04>; -+ clocks = <&clks 124>, <&clks 123>; -+ clock-names = "hdmi_isfr", "hdmi_iahb"; -+ status = "disabled"; -+ }; -+ -+ hdmi_audio: hdmi_audio@00120000 { -+ compatible = "fsl,imx6q-hdmi-audio"; -+ clocks = <&clks 124>, <&clks 123>; -+ clock-names = "hdmi_isfr", "hdmi_iahb"; -+ dmas = <&sdma 2 23 0>; -+ dma-names = "tx"; -+ status = "disabled"; -+ }; -+ -+ hdmi_cec: hdmi_cec@00120000 { -+ compatible = "fsl,imx6q-hdmi-cec"; -+ interrupts = <0 115 0x04>; -+ status = "disabled"; -+ }; -+ -+ ocrams: sram@00900000 { -+ compatible = "fsl,lpm-sram"; -+ reg = <0x00900000 0x4000>; -+ clocks = <&clks IMX6QDL_CLK_OCRAM>; -+ }; -+ -+ ocrams_ddr: sram@00904000 { -+ compatible = "fsl,ddr-lpm-sram"; -+ reg = <0x00904000 0x1000>; -+ clocks = <&clks IMX6QDL_CLK_OCRAM>; -+ }; -+ -+ ocram: sram@00905000 { - compatible = "mmio-sram"; -- reg = <0x00900000 0x20000>; -+ reg = 
<0x00905000 0x1B000>; - clocks = <&clks IMX6QDL_CLK_OCRAM>; - }; - - aips1: aips-bus@02000000 { -+ vpu@02040000 { -+ iramsize = <0>; -+ status = "okay"; -+ }; -+ - iomuxc: iomuxc@020e0000 { - compatible = "fsl,imx6dl-iomuxc"; - }; - -+ dcic2: dcic@020e8000 { -+ clocks = <&clks IMX6QDL_CLK_DCIC1 >, -+ <&clks IMX6QDL_CLK_DCIC2>; /* DCIC2 depend on DCIC1 clock in imx6dl*/ -+ clock-names = "dcic", "disp-axi"; -+ }; -+ - pxp: pxp@020f0000 { - reg = <0x020f0000 0x4000>; - interrupts = <0 98 IRQ_TYPE_LEVEL_HIGH>; -@@ -99,26 +185,13 @@ - }; - }; - }; -- -- display-subsystem { -- compatible = "fsl,imx-display-subsystem"; -- ports = <&ipu1_di0>, <&ipu1_di1>; -- }; --}; -- --&hdmi { -- compatible = "fsl,imx6dl-hdmi"; - }; - - &ldb { -- clocks = <&clks IMX6QDL_CLK_LDB_DI0_SEL>, <&clks IMX6QDL_CLK_LDB_DI1_SEL>, -- <&clks IMX6QDL_CLK_IPU1_DI0_SEL>, <&clks IMX6QDL_CLK_IPU1_DI1_SEL>, -- <&clks IMX6QDL_CLK_LDB_DI0>, <&clks IMX6QDL_CLK_LDB_DI1>; -+ clocks = <&clks 33>, <&clks 34>, -+ <&clks 39>, <&clks 40>, -+ <&clks 135>, <&clks 136>; - clock-names = "di0_pll", "di1_pll", - "di0_sel", "di1_sel", - "di0", "di1"; - }; -- --&vpu { -- compatible = "fsl,imx6dl-vpu", "cnm,coda960"; --}; -diff -Nur linux-4.1.3/arch/arm/boot/dts/imx6qdl-cubox-i.dtsi linux-xbian-imx6/arch/arm/boot/dts/imx6qdl-cubox-i.dtsi ---- linux-4.1.3/arch/arm/boot/dts/imx6qdl-cubox-i.dtsi 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/arch/arm/boot/dts/imx6qdl-cubox-i.dtsi 2015-07-27 23:13:00.303898027 +0200 -@@ -45,11 +45,22 @@ - #include - - / { -+ chosen { -+ bootargs = "quiet console=ttymxc0,115200 root=/dev/mmcblk0p2 rw"; -+ }; -+ -+ aliases { -+ mmc0 = &usdhc2; -+ mmc1 = &usdhc1; -+ mxcfb0 = &mxcfb1; -+ }; -+ - ir_recv: ir-receiver { - compatible = "gpio-ir-receiver"; - gpios = <&gpio3 9 1>; - pinctrl-names = "default"; - pinctrl-0 = <&pinctrl_cubox_i_ir>; -+ linux,rc-map-name = "rc-rc6-mce"; - }; - - pwmleds { -@@ -78,6 +89,8 @@ - - reg_usbh1_vbus: usb-h1-vbus { - compatible = "regulator-fixed"; -+ regulator-boot-on; -+ regulator-always-on; - enable-active-high; - gpio = <&gpio1 0 0>; - pinctrl-names = "default"; -@@ -89,6 +102,8 @@ - - reg_usbotg_vbus: usb-otg-vbus { - compatible = "regulator-fixed"; -+ regulator-boot-on; -+ regulator-always-on; - enable-active-high; - gpio = <&gpio3 22 0>; - pinctrl-names = "default"; -@@ -101,8 +116,7 @@ - - sound-spdif { - compatible = "fsl,imx-audio-spdif"; -- model = "Integrated SPDIF"; -- /* IMX6 doesn't implement this yet */ -+ model = "imx-spdif"; - spdif-controller = <&spdif>; - spdif-out; - }; -@@ -118,12 +132,45 @@ - linux,code = ; - }; - }; -+ -+ sound-hdmi { -+ compatible = "fsl,imx6q-audio-hdmi", -+ "fsl,imx-audio-hdmi"; -+ model = "imx-audio-hdmi"; -+ hdmi-controller = <&hdmi_audio>; -+ }; -+ -+ mxcfb1: fb@0 { -+ compatible = "fsl,mxc_sdc_fb"; -+ disp_dev = "hdmi"; -+ interface_pix_fmt = "RGB24"; -+ mode_str ="1920x1080M@60"; -+ default_bpp = <32>; -+ int_clk = <0>; -+ late_init = <0>; -+ status = "okay"; -+ }; -+}; -+ -+&hdmi_core { -+ ipu_id = <0>; -+ disp_id = <0>; -+ status = "okay"; -+}; -+ -+&hdmi_video { -+ fsl,phy_reg_vlev = <0x0294>; -+ fsl,phy_reg_cksymtx = <0x800d>; -+ status = "okay"; -+}; -+ -+&hdmi_audio { -+ status = "okay"; - }; - --&hdmi { -+&hdmi_cec { - pinctrl-names = "default"; - pinctrl-0 = <&pinctrl_cubox_i_hdmi>; -- ddc-i2c-bus = <&i2c2>; - status = "okay"; - }; - -@@ -131,7 +178,13 @@ - clock-frequency = <100000>; - pinctrl-names = "default"; - pinctrl-0 = <&pinctrl_cubox_i_i2c2>; -+ - status = "okay"; -+ -+ ddc: imx6_hdmi_i2c@50 { -+ compatible = 
"fsl,imx6-hdmi-i2c"; -+ reg = <0x50>; -+ }; - }; - - &i2c3 { -@@ -228,6 +281,28 @@ - MX6QDL_PAD_EIM_DA8__GPIO3_IO08 0x17059 - >; - }; -+ -+ pinctrl_cubox_i_usdhc2_100mhz: cubox-i-usdhc2-100mhz { -+ fsl,pins = < -+ MX6QDL_PAD_SD2_CMD__SD2_CMD 0x170b9 -+ MX6QDL_PAD_SD2_CLK__SD2_CLK 0x100b9 -+ MX6QDL_PAD_SD2_DAT0__SD2_DATA0 0x170b9 -+ MX6QDL_PAD_SD2_DAT1__SD2_DATA1 0x170b9 -+ MX6QDL_PAD_SD2_DAT2__SD2_DATA2 0x170b9 -+ MX6QDL_PAD_SD2_DAT3__SD2_DATA3 0x130b9 -+ >; -+ }; -+ -+ pinctrl_cubox_i_usdhc2_200mhz: cubox-i-usdhc2-200mhz { -+ fsl,pins = < -+ MX6QDL_PAD_SD2_CMD__SD2_CMD 0x170f9 -+ MX6QDL_PAD_SD2_CLK__SD2_CLK 0x100f9 -+ MX6QDL_PAD_SD2_DAT0__SD2_DATA0 0x170f9 -+ MX6QDL_PAD_SD2_DAT1__SD2_DATA1 0x170f9 -+ MX6QDL_PAD_SD2_DAT2__SD2_DATA2 0x170f9 -+ MX6QDL_PAD_SD2_DAT3__SD2_DATA3 0x130f9 -+ >; -+ }; - }; - }; - -@@ -256,9 +331,24 @@ - }; - - &usdhc2 { -- pinctrl-names = "default"; -+ pinctrl-names = "default", "state_100mhz", "state_200mhz"; - pinctrl-0 = <&pinctrl_cubox_i_usdhc2_aux &pinctrl_cubox_i_usdhc2>; -+ pinctrl-1 = <&pinctrl_cubox_i_usdhc2_aux &pinctrl_cubox_i_usdhc2_100mhz>; -+ pinctrl-2 = <&pinctrl_cubox_i_usdhc2_aux &pinctrl_cubox_i_usdhc2_200mhz>; - vmmc-supply = <®_3p3v>; - cd-gpios = <&gpio1 4 0>; - status = "okay"; -+ no-1-8-v; -+}; -+ -+&dcic1 { -+ dcic_id = <0>; -+ dcic_mux = "dcic-hdmi"; -+ status = "okay"; -+}; -+ -+&dcic2 { -+ dcic_id = <1>; -+ dcic_mux = "dcic-lvds1"; -+ status = "okay"; - }; -diff -Nur linux-4.1.3/arch/arm/boot/dts/imx6qdl.dtsi linux-xbian-imx6/arch/arm/boot/dts/imx6qdl.dtsi ---- linux-4.1.3/arch/arm/boot/dts/imx6qdl.dtsi 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/arch/arm/boot/dts/imx6qdl.dtsi 2015-07-27 23:13:00.303898027 +0200 -@@ -14,6 +14,7 @@ - #include - - #include "skeleton.dtsi" -+#include - - / { - aliases { -@@ -30,6 +31,7 @@ - i2c0 = &i2c1; - i2c1 = &i2c2; - i2c2 = &i2c3; -+ ipu0 = &ipu1; - mmc0 = &usdhc1; - mmc1 = &usdhc2; - mmc2 = &usdhc3; -@@ -79,6 +81,10 @@ - }; - }; - -+ pu_dummy: pudummy_reg { -+ compatible = "fsl,imx6-dummy-pureg"; /* only used in ldo-bypass */ -+ }; -+ - soc { - #address-cells = <1>; - #size-cells = <1>; -@@ -86,6 +92,11 @@ - interrupt-parent = <&gpc>; - ranges; - -+ caam_sm: caam-sm@00100000 { -+ compatible = "fsl,imx6q-caam-sm"; -+ reg = <0x00100000 0x3fff>; -+ }; -+ - dma_apbh: dma-apbh@00110000 { - compatible = "fsl,imx6q-dma-apbh", "fsl,imx28-dma-apbh"; - reg = <0x00110000 0x2000>; -@@ -99,6 +110,12 @@ - clocks = <&clks IMX6QDL_CLK_APBH_DMA>; - }; - -+ irq_sec_vio: caam_secvio { -+ compatible = "fsl,imx6q-caam-secvio"; -+ interrupts = <0 20 0x04>; -+ secvio_src = <0x8000001d>; -+ }; -+ - gpmi: gpmi-nand@00112000 { - compatible = "fsl,imx6q-gpmi-nand"; - #address-cells = <1>; -@@ -190,16 +207,16 @@ - dmas = <&sdma 14 18 0>, - <&sdma 15 18 0>; - dma-names = "rx", "tx"; -- clocks = <&clks IMX6QDL_CLK_SPDIF>, <&clks IMX6QDL_CLK_OSC>, -- <&clks IMX6QDL_CLK_SPDIF>, <&clks IMX6QDL_CLK_DUMMY>, -- <&clks IMX6QDL_CLK_DUMMY>, <&clks IMX6QDL_CLK_DUMMY>, -- <&clks IMX6QDL_CLK_DUMMY>, <&clks IMX6QDL_CLK_DUMMY>, -- <&clks IMX6QDL_CLK_DUMMY>; -+ clocks = <&clks IMX6QDL_CLK_SPDIF_GCLK>, <&clks IMX6QDL_CLK_OSC>, -+ <&clks IMX6QDL_CLK_SPDIF>, <&clks IMX6QDL_CLK_ASRC>, -+ <&clks IMX6QDL_CLK_DUMMY>, <&clks IMX6QDL_CLK_ESAI_EXTAL>, -+ <&clks IMX6QDL_CLK_IPG>, <&clks IMX6QDL_CLK_MLB>, -+ <&clks IMX6QDL_CLK_DUMMY>, <&clks IMX6QDL_CLK_SPBA>; - clock-names = "core", "rxtx0", - "rxtx1", "rxtx2", - "rxtx3", "rxtx4", - "rxtx5", "rxtx6", -- "rxtx7"; -+ "rxtx7", "dma"; - status = "disabled"; - }; - -@@ -274,7 +291,12 @@ - esai: 
esai@02024000 { - reg = <0x02024000 0x4000>; - interrupts = <0 51 IRQ_TYPE_LEVEL_HIGH>; -- }; -+ compatible = "fsl,imx6q-esai"; -+ clocks = <&clks 118>; -+ fsl,esai-dma-events = <24 23>; -+ fsl,flags = <1>; -+ status = "disabled"; -+ }; - - ssi1: ssi@02028000 { - #sound-dai-cells = <0>; -@@ -325,8 +347,30 @@ - }; - - asrc: asrc@02034000 { -+ compatible = "fsl,imx53-asrc"; - reg = <0x02034000 0x4000>; - interrupts = <0 50 IRQ_TYPE_LEVEL_HIGH>; -+ clocks = <&clks IMX6QDL_CLK_ASRC_MEM>, -+ <&clks IMX6QDL_CLK_ASRC_IPG>, -+ <&clks IMX6QDL_CLK_SPDIF>, -+ <&clks IMX6QDL_CLK_SPBA>; -+ clock-names = "mem", "ipg", "asrck_0", "dma"; -+ dmas = <&sdma 17 20 1>, <&sdma 18 20 1>, <&sdma 19 20 1>, -+ <&sdma 20 20 1>, <&sdma 21 20 1>, <&sdma 22 20 1>; -+ dma-names = "rxa", "rxb", "rxc", -+ "txa", "txb", "txc"; -+ fsl,asrc-rate = <48000>; -+ fsl,asrc-width = <16>; -+ status = "okay"; -+ }; -+ -+ asrc_p2p: asrc_p2p { -+ compatible = "fsl,imx6q-asrc-p2p"; -+ fsl,output-rate = <48000>; -+ fsl,output-width = <16>; -+ fsl,asrc-dma-rx-events = <17 18 19>; -+ fsl,asrc-dma-tx-events = <20 21 22>; -+ status = "okay"; - }; - - spba@0203c000 { -@@ -335,16 +379,20 @@ - }; - - vpu: vpu@02040000 { -- compatible = "cnm,coda960"; -+ compatible = "cnm,coda960", "fsl,imx6-vpu"; - reg = <0x02040000 0x3c000>; -+ reg-names = "vpu_regs"; - interrupts = <0 12 IRQ_TYPE_LEVEL_HIGH>, - <0 3 IRQ_TYPE_LEVEL_HIGH>; - interrupt-names = "bit", "jpeg"; - clocks = <&clks IMX6QDL_CLK_VPU_AXI>, -- <&clks IMX6QDL_CLK_MMDC_CH0_AXI>; -- clock-names = "per", "ahb"; -- resets = <&src 1>; -+ <&clks IMX6QDL_CLK_MMDC_CH0_AXI>, -+ <&clks IMX6QDL_CLK_OCRAM>; -+ clock-names = "per", "ahb", "ocram"; -+ iramsize = <0x21000>; - iram = <&ocram>; -+ resets = <&src 1>; -+ power-domains = <&gpc 1>; - }; - - aipstz@0207c000 { /* AIPSTZ1 */ -@@ -552,20 +600,21 @@ - anatop-min-bit-val = <4>; - anatop-min-voltage = <800000>; - anatop-max-voltage = <1375000>; -+ anatop-enable-bit = <0>; - }; - -- regulator-3p0@120 { -+ reg_3p0: regulator-3p0@120 { - compatible = "fsl,anatop-regulator"; - regulator-name = "vdd3p0"; -- regulator-min-microvolt = <2800000>; -- regulator-max-microvolt = <3150000>; -- regulator-always-on; -+ regulator-min-microvolt = <2625000>; -+ regulator-max-microvolt = <3400000>; - anatop-reg-offset = <0x120>; - anatop-vol-bit-shift = <8>; - anatop-vol-bit-width = <5>; - anatop-min-bit-val = <0>; - anatop-min-voltage = <2625000>; - anatop-max-voltage = <3400000>; -+ anatop-enable-bit = <0>; - }; - - regulator-2p5@130 { -@@ -580,6 +629,7 @@ - anatop-min-bit-val = <0>; - anatop-min-voltage = <2000000>; - anatop-max-voltage = <2750000>; -+ anatop-enable-bit = <0>; - }; - - reg_arm: regulator-vddcore@140 { -@@ -647,6 +697,7 @@ - reg = <0x020c9000 0x1000>; - interrupts = <0 44 IRQ_TYPE_LEVEL_HIGH>; - clocks = <&clks IMX6QDL_CLK_USBPHY1>; -+ phy-3p0-supply = <®_3p0>; - fsl,anatop = <&anatop>; - }; - -@@ -655,9 +706,15 @@ - reg = <0x020ca000 0x1000>; - interrupts = <0 45 IRQ_TYPE_LEVEL_HIGH>; - clocks = <&clks IMX6QDL_CLK_USBPHY2>; -+ phy-3p0-supply = <®_3p0>; - fsl,anatop = <&anatop>; - }; - -+ caam_snvs: caam-snvs@020cc000 { -+ compatible = "fsl,imx6q-caam-snvs"; -+ reg = <0x020cc000 0x4000>; -+ }; -+ - snvs@020cc000 { - compatible = "fsl,sec-v4.0-mon", "simple-bus"; - #address-cells = <1>; -@@ -704,14 +761,12 @@ - interrupts = <0 89 IRQ_TYPE_LEVEL_HIGH>, - <0 90 IRQ_TYPE_LEVEL_HIGH>; - interrupt-parent = <&intc>; -- pu-supply = <®_pu>; -- clocks = <&clks IMX6QDL_CLK_GPU3D_CORE>, -- <&clks IMX6QDL_CLK_GPU3D_SHADER>, -- <&clks IMX6QDL_CLK_GPU2D_CORE>, -- 
<&clks IMX6QDL_CLK_GPU2D_AXI>, -- <&clks IMX6QDL_CLK_OPENVG_AXI>, -- <&clks IMX6QDL_CLK_VPU_AXI>; - #power-domain-cells = <1>; -+ clocks = <&clks 122>, <&clks 74>, <&clks 121>, -+ <&clks 26>, <&clks 143>, <&clks 168>; -+ clock-names = "gpu3d_core", "gpu3d_shader", "gpu2d_core", -+ "gpu2d_axi", "openvg_axi", "vpu_axi"; -+ pu-supply = <®_pu>; - }; - - gpr: iomuxc-gpr@020e0000 { -@@ -736,22 +791,6 @@ - #size-cells = <0>; - reg = <0>; - status = "disabled"; -- -- port@0 { -- reg = <0>; -- -- lvds0_mux_0: endpoint { -- remote-endpoint = <&ipu1_di0_lvds0>; -- }; -- }; -- -- port@1 { -- reg = <1>; -- -- lvds0_mux_1: endpoint { -- remote-endpoint = <&ipu1_di1_lvds0>; -- }; -- }; - }; - - lvds-channel@1 { -@@ -759,22 +798,6 @@ - #size-cells = <0>; - reg = <1>; - status = "disabled"; -- -- port@0 { -- reg = <0>; -- -- lvds1_mux_0: endpoint { -- remote-endpoint = <&ipu1_di0_lvds1>; -- }; -- }; -- -- port@1 { -- reg = <1>; -- -- lvds1_mux_1: endpoint { -- remote-endpoint = <&ipu1_di1_lvds1>; -- }; -- }; - }; - }; - -@@ -788,32 +811,26 @@ - <&clks IMX6QDL_CLK_HDMI_ISFR>; - clock-names = "iahb", "isfr"; - status = "disabled"; -- -- port@0 { -- reg = <0>; -- -- hdmi_mux_0: endpoint { -- remote-endpoint = <&ipu1_di0_hdmi>; -- }; -- }; -- -- port@1 { -- reg = <1>; -- -- hdmi_mux_1: endpoint { -- remote-endpoint = <&ipu1_di1_hdmi>; -- }; -- }; - }; - - dcic1: dcic@020e4000 { -+ compatible = "fsl,imx6q-dcic"; - reg = <0x020e4000 0x4000>; - interrupts = <0 124 IRQ_TYPE_LEVEL_HIGH>; -+ clocks = <&clks IMX6QDL_CLK_DCIC1>, <&clks IMX6QDL_CLK_DCIC1>; -+ clock-names = "dcic", "disp-axi"; -+ gpr = <&gpr>; -+ status = "disabled"; - }; - - dcic2: dcic@020e8000 { -+ compatible = "fsl,imx6q-dcic"; - reg = <0x020e8000 0x4000>; - interrupts = <0 125 IRQ_TYPE_LEVEL_HIGH>; -+ clocks = <&clks IMX6QDL_CLK_DCIC2>, <&clks IMX6QDL_CLK_DCIC2>; -+ clock-names = "dcic", "disp-axi"; -+ gpr = <&gpr>; -+ status = "disabled"; - }; - - sdma: sdma@020ec000 { -@@ -824,6 +841,7 @@ - <&clks IMX6QDL_CLK_SDMA>; - clock-names = "ipg", "ahb"; - #dma-cells = <3>; -+ iram = <&ocram>; - fsl,sdma-ram-script-name = "imx/sdma/sdma-imx6q.bin"; - }; - }; -@@ -835,10 +853,30 @@ - reg = <0x02100000 0x100000>; - ranges; - -- caam@02100000 { -- reg = <0x02100000 0x40000>; -- interrupts = <0 105 IRQ_TYPE_LEVEL_HIGH>, -- <0 106 IRQ_TYPE_LEVEL_HIGH>; -+ crypto: caam@2100000 { -+ compatible = "fsl,sec-v4.0"; -+ #address-cells = <1>; -+ #size-cells = <1>; -+ reg = <0x2100000 0x40000>; -+ ranges = <0 0x2100000 0x40000>; -+ interrupt-parent = <&intc>; /* interrupts = <0 92 0x4>; */ -+ interrupts = <0 92 0x4>; -+ clocks = <&clks 213>, <&clks 214>, <&clks 215> ,<&clks 196>; -+ clock-names = "caam_mem", "caam_aclk", "caam_ipg", "caam_emi_slow"; -+ -+ sec_jr0: jr0@1000 { -+ compatible = "fsl,sec-v4.0-job-ring"; -+ reg = <0x1000 0x1000>; -+ interrupt-parent = <&intc>; -+ interrupts = <0 105 IRQ_TYPE_LEVEL_HIGH>; -+ }; -+ -+ sec_jr1: jr1@2000 { -+ compatible = "fsl,sec-v4.0-job-ring"; -+ reg = <0x2000 0x1000>; -+ interrupt-parent = <&intc>; -+ interrupts = <0 106 IRQ_TYPE_LEVEL_HIGH>; -+ }; - }; - - aipstz@0217c000 { /* AIPSTZ2 */ -@@ -852,6 +890,7 @@ - clocks = <&clks IMX6QDL_CLK_USBOH3>; - fsl,usbphy = <&usbphy1>; - fsl,usbmisc = <&usbmisc 0>; -+ fsl,anatop = <&anatop>; - status = "disabled"; - }; - -@@ -903,14 +942,21 @@ - <&clks IMX6QDL_CLK_ENET>, - <&clks IMX6QDL_CLK_ENET_REF>; - clock-names = "ipg", "ahb", "ptp"; -- status = "disabled"; -+ phy-mode = "rgmii"; -+ fsl,magic-packet; -+ status = "okay"; - }; - -- mlb@0218c000 { -+ mlb: mlb@0218c000 { - reg = 
<0x0218c000 0x4000>; - interrupts = <0 53 IRQ_TYPE_LEVEL_HIGH>, - <0 117 IRQ_TYPE_LEVEL_HIGH>, - <0 126 IRQ_TYPE_LEVEL_HIGH>; -+ compatible = "fsl,imx6q-mlb150"; -+ clocks = <&clks 139>, <&clks 175>; -+ clock-names = "mlb", "pll8_mlb"; -+ iram = <&ocram>; -+ status = "disabled"; - }; - - usdhc1: usdhc@02190000 { -@@ -995,6 +1041,11 @@ - reg = <0x021ac000 0x4000>; - }; - -+ mmdc0-1@021b0000 { -+ compatible = "fsl,imx6q-mmdc-combine"; -+ reg = <0x021b0000 0x8000>; -+ }; -+ - mmdc0: mmdc@021b0000 { /* MMDC0 */ - compatible = "fsl,imx6q-mmdc"; - reg = <0x021b0000 0x4000>; -@@ -1011,11 +1062,17 @@ - clocks = <&clks IMX6QDL_CLK_EIM_SLOW>; - }; - -- ocotp: ocotp@021bc000 { -- compatible = "fsl,imx6q-ocotp", "syscon"; -+ ocotp: ocotp-ctrl@021bc000 { -+ compatible = "syscon"; - reg = <0x021bc000 0x4000>; - }; - -+ ocotp-fuse@021bc000 { -+ compatible = "fsl,imx6q-ocotp"; -+ reg = <0x021bc000 0x4000>; -+ clocks = <&clks 128>; -+ }; -+ - tzasc@021d0000 { /* TZASC1 */ - reg = <0x021d0000 0x4000>; - interrupts = <0 108 IRQ_TYPE_LEVEL_HIGH>; -@@ -1034,39 +1091,38 @@ - - mipi_csi: mipi@021dc000 { - reg = <0x021dc000 0x4000>; -+ compatible = "fsl,imx6q-mipi-csi2"; -+ interrupts = <0 100 0x04>, <0 101 0x04>; -+ clocks = <&clks IMX6QDL_CLK_HSI_TX>, -+ <&clks IMX6QDL_CLK_EIM_SEL>, -+ <&clks IMX6QDL_CLK_LVDS2_IN>; -+ /* Note: clks 138 is hsi_tx, however, the dphy_c -+ * hsi_tx and pll_refclk use the same clk gate. -+ * In current clk driver, open/close clk gate do -+ * use hsi_tx for a temporary debug purpose. -+ */ -+ clock-names = "dphy_clk", "pixel_clk", "cfg_clk"; -+ status = "disabled"; - }; - - mipi_dsi: mipi@021e0000 { -+ compatible = "fsl,imx6q-mipi-dsi"; - #address-cells = <1>; - #size-cells = <0>; - reg = <0x021e0000 0x4000>; - status = "disabled"; -- -- ports { -- #address-cells = <1>; -- #size-cells = <0>; -- -- port@0 { -- reg = <0>; -- -- mipi_mux_0: endpoint { -- remote-endpoint = <&ipu1_di0_mipi>; -- }; -- }; -- -- port@1 { -- reg = <1>; -- -- mipi_mux_1: endpoint { -- remote-endpoint = <&ipu1_di1_mipi>; -- }; -- }; -- }; -+ interrupts = <0 102 0x04>; -+ gpr = <&gpr>; -+ clocks = <&clks IMX6QDL_CLK_HSI_TX>, <&clks IMX6QDL_CLK_VIDEO_27M>; -+ clock-names = "mipi_pllref_clk", "mipi_cfg_clk"; - }; - - vdoa@021e4000 { -+ compatible = "fsl,imx6q-vdoa"; - reg = <0x021e4000 0x4000>; - interrupts = <0 18 IRQ_TYPE_LEVEL_HIGH>; -+ clocks = <&clks 202>; -+ iram = <&ocram>; - }; - - uart2: serial@021e8000 { -@@ -1127,67 +1183,14 @@ - <0 5 IRQ_TYPE_LEVEL_HIGH>; - clocks = <&clks IMX6QDL_CLK_IPU1>, - <&clks IMX6QDL_CLK_IPU1_DI0>, -- <&clks IMX6QDL_CLK_IPU1_DI1>; -- clock-names = "bus", "di0", "di1"; -+ <&clks IMX6QDL_CLK_IPU1_DI1>, -+ <&clks 39>, <&clks 40>, -+ <&clks 135>, <&clks 136>; -+ clock-names = "bus", "di0", "di1", -+ "di0_sel", "di1_sel", -+ "ldb_di0", "ldb_di1"; - resets = <&src 2>; -- -- ipu1_csi0: port@0 { -- reg = <0>; -- }; -- -- ipu1_csi1: port@1 { -- reg = <1>; -- }; -- -- ipu1_di0: port@2 { -- #address-cells = <1>; -- #size-cells = <0>; -- reg = <2>; -- -- ipu1_di0_disp0: endpoint@0 { -- }; -- -- ipu1_di0_hdmi: endpoint@1 { -- remote-endpoint = <&hdmi_mux_0>; -- }; -- -- ipu1_di0_mipi: endpoint@2 { -- remote-endpoint = <&mipi_mux_0>; -- }; -- -- ipu1_di0_lvds0: endpoint@3 { -- remote-endpoint = <&lvds0_mux_0>; -- }; -- -- ipu1_di0_lvds1: endpoint@4 { -- remote-endpoint = <&lvds1_mux_0>; -- }; -- }; -- -- ipu1_di1: port@3 { -- #address-cells = <1>; -- #size-cells = <0>; -- reg = <3>; -- -- ipu1_di0_disp1: endpoint@0 { -- }; -- -- ipu1_di1_hdmi: endpoint@1 { -- remote-endpoint = <&hdmi_mux_1>; 
-- }; -- -- ipu1_di1_mipi: endpoint@2 { -- remote-endpoint = <&mipi_mux_1>; -- }; -- -- ipu1_di1_lvds0: endpoint@3 { -- remote-endpoint = <&lvds0_mux_1>; -- }; -- -- ipu1_di1_lvds1: endpoint@4 { -- remote-endpoint = <&lvds1_mux_1>; -- }; -- }; -+ bypass_reset = <0>; - }; - }; - }; -diff -Nur linux-4.1.3/arch/arm/boot/dts/imx6qdl-hummingboard.dtsi linux-xbian-imx6/arch/arm/boot/dts/imx6qdl-hummingboard.dtsi ---- linux-4.1.3/arch/arm/boot/dts/imx6qdl-hummingboard.dtsi 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/arch/arm/boot/dts/imx6qdl-hummingboard.dtsi 2015-07-27 23:13:00.303898027 +0200 -@@ -43,8 +43,10 @@ - #include "imx6qdl-microsom-ar8035.dtsi" - - / { -- chosen { -- stdout-path = &uart1; -+ aliases { -+ mmc0 = &usdhc2; -+ mmc1 = &usdhc1; -+ mxcfb0 = &mxcfb1; - }; - - ir_recv: ir-receiver { -@@ -52,6 +54,7 @@ - gpios = <&gpio3 5 1>; - pinctrl-names = "default"; - pinctrl-0 = <&pinctrl_hummingboard_gpio3_5>; -+ linux,rc-map-name = "rc-rc6-mce"; - }; - - regulators { -@@ -98,32 +101,70 @@ - model = "On-board Codec"; - mux-ext-port = <5>; - mux-int-port = <1>; -+ cpu-dai = <&ssi1>; - ssi-controller = <&ssi1>; - }; - - sound-spdif { - compatible = "fsl,imx-audio-spdif"; -- model = "On-board SPDIF"; -+ model = "imx-spdif"; - /* IMX6 doesn't implement this yet */ - spdif-controller = <&spdif>; - spdif-out; - }; -+ -+ sound-hdmi { -+ compatible = "fsl,imx6q-audio-hdmi", -+ "fsl,imx-audio-hdmi"; -+ model = "imx-audio-hdmi"; -+ hdmi-controller = <&hdmi_audio>; -+ }; -+ -+ mxcfb1: fb@0 { -+ compatible = "fsl,mxc_sdc_fb"; -+ disp_dev = "hdmi"; -+ interface_pix_fmt = "RGB24"; -+ mode_str ="1920x1080M@60"; -+ default_bpp = <32>; -+ int_clk = <0>; -+ late_init = <0>; -+ status = "okay"; -+ }; - }; - - &audmux { - status = "okay"; - }; - --&can1 { -+/*&can1 { - pinctrl-names = "default"; - pinctrl-0 = <&pinctrl_hummingboard_flexcan1>; - status = "okay"; - }; -+*/ -+&hdmi_core { -+ ipu_id = <0>; -+ disp_id = <0>; -+ status = "okay"; -+}; -+ -+&hdmi_video { -+ fsl,phy_reg_vlev = <0x0294>; -+ fsl,phy_reg_cksymtx = <0x800d>; -+ status = "okay"; -+}; -+ -+&hdmi_audio { -+ status = "okay"; -+}; -+ -+&ocram { -+ status = "okay"; -+}; - --&hdmi { -+&hdmi_cec { - pinctrl-names = "default"; - pinctrl-0 = <&pinctrl_hummingboard_hdmi>; -- ddc-i2c-bus = <&i2c2>; - status = "okay"; - }; - -@@ -136,6 +177,7 @@ - rtc: pcf8523@68 { - compatible = "nxp,pcf8523"; - reg = <0x68>; -+ nxp,12p5_pf; - }; - - /* Pro baseboard model */ -@@ -155,20 +197,57 @@ - pinctrl-names = "default"; - pinctrl-0 = <&pinctrl_hummingboard_i2c2>; - status = "okay"; -+ -+ ddc: imx6_hdmi_i2c@50 { -+ compatible = "fsl,imx6-hdmi-i2c"; -+ reg = <0x50>; -+ }; - }; - - &iomuxc { -+ pinctrl-names = "default"; -+ pinctrl-0 = <&pinctrl_hog>; - hummingboard { -- pinctrl_hummingboard_flexcan1: hummingboard-flexcan1 { -+ pinctrl_hog: hoggrp { -+ fsl,pins = < -+ /* -+ * 26 pin header GPIO description. The pins. 
-+ * numbering as following - -+ * GPIO number | GPIO (bank,num) | PIN number -+ * ------------+-----------------+------------ -+ * gpio1 | (1,1) | IO7 -+ * gpio73 | (3,9) | IO11 -+ * gpio72 | (3,8) | IO12 -+ * gpio71 | (3,7) | IO13 -+ * gpio70 | (3,6) | IO15 -+ * gpio194 | (7,2) | IO16 -+ * gpio195 | (7,3) | IO18 -+ * gpio67 | (3,3) | IO22 -+ * -+ * Notice the gpioX and GPIO (Y,Z) mapping forumla : -+ * X = (Y-1) * 32 + Z -+ */ -+ MX6QDL_PAD_GPIO_1__GPIO1_IO01 0x400130b1 -+ MX6QDL_PAD_EIM_DA9__GPIO3_IO09 0x400130b1 -+ MX6QDL_PAD_EIM_DA8__GPIO3_IO08 0x400130b1 -+ MX6QDL_PAD_EIM_DA7__GPIO3_IO07 0x400130b1 -+ MX6QDL_PAD_EIM_DA6__GPIO3_IO06 0x400130b1 -+ MX6QDL_PAD_SD3_CMD__GPIO7_IO02 0x400130b1 -+ MX6QDL_PAD_SD3_CLK__GPIO7_IO03 0x400130b1 -+ MX6QDL_PAD_EIM_DA3__GPIO3_IO03 0x400130b1 -+ >; -+ }; -+ -+/* pinctrl_hummingboard_flexcan1: hummingboard-flexcan1 { - fsl,pins = < - MX6QDL_PAD_SD3_CLK__FLEXCAN1_RX 0x80000000 - MX6QDL_PAD_SD3_CMD__FLEXCAN1_TX 0x80000000 - >; - }; -- -+*/ - pinctrl_hummingboard_gpio3_5: hummingboard-gpio3_5 { - fsl,pins = < -- MX6QDL_PAD_EIM_DA5__GPIO3_IO05 0x1b0b1 -+ MX6QDL_PAD_EIM_DA5__GPIO3_IO05 0x80000000 - >; - }; - -@@ -198,10 +277,10 @@ - - pinctrl_hummingboard_sgtl5000: hummingboard-sgtl5000 { - fsl,pins = < -- MX6QDL_PAD_DISP0_DAT19__AUD5_RXD 0x130b0 -- MX6QDL_PAD_KEY_COL0__AUD5_TXC 0x130b0 -- MX6QDL_PAD_KEY_ROW0__AUD5_TXD 0x110b0 -- MX6QDL_PAD_KEY_COL1__AUD5_TXFS 0x130b0 -+ MX6QDL_PAD_DISP0_DAT19__AUD5_RXD 0x130b0 /*brk*/ -+ MX6QDL_PAD_KEY_COL0__AUD5_TXC 0x130b0 /*ok*/ -+ MX6QDL_PAD_KEY_ROW0__AUD5_TXD 0x110b0 /*brk*/ -+ MX6QDL_PAD_KEY_COL1__AUD5_TXFS 0x130b0 /*ok*/ - MX6QDL_PAD_GPIO_5__CCM_CLKO1 0x130b0 - >; - }; -@@ -219,7 +298,7 @@ - * Similar to pinctrl_usbotg_2, but we want it - * pulled down for a fixed host connection. 
- */ -- fsl,pins = ; -+ fsl,pins = ; - }; - - pinctrl_hummingboard_usbotg_vbus: hummingboard-usbotg-vbus { -@@ -242,6 +321,13 @@ - MX6QDL_PAD_SD2_DAT3__SD2_DATA3 0x13059 - >; - }; -+ -+ pinctrl_hummingboard_pcie_reset: hummingboard-pcie-reset { -+ fsl,pins = < -+ MX6QDL_PAD_EIM_DA4__GPIO3_IO04 0x80000000 -+ >; -+ }; -+ - }; - }; - -@@ -256,6 +342,14 @@ - status = "okay"; - }; - -+&pwm3 { -+ status = "disabled"; -+}; -+ -+&pwm4 { -+ status = "disabled"; -+}; -+ - &spdif { - pinctrl-names = "default"; - pinctrl-0 = <&pinctrl_hummingboard_spdif>; -@@ -291,3 +385,48 @@ - cd-gpios = <&gpio1 4 0>; - status = "okay"; - }; -+ -+&gpc { -+ fsl,cpu_pupscr_sw2iso = <0xf>; -+ fsl,cpu_pupscr_sw = <0xf>; -+ fsl,cpu_pdnscr_iso2sw = <0x1>; -+ fsl,cpu_pdnscr_iso = <0x1>; -+ status = "okay"; -+}; -+ -+&pcie { -+ pinctrl-names = "default"; -+ pinctrl-0 = < -+ &pinctrl_hummingboard_pcie_reset -+ >; -+ reset-gpio = <&gpio3 4 0>; -+ status = "okay"; -+ no-msi; -+}; -+ -+&ecspi1 { -+ status = "okay"; -+ fsl,spi-num-chipselects = <1>; -+}; -+ -+&ecspi2 { -+ status = "okay"; -+ fsl,spi-num-chipselects = <2>; -+}; -+ -+&ecspi3 { -+ status = "okay"; -+ fsl,spi-num-chipselects = <3>; -+}; -+ -+&dcic1 { -+ dcic_id = <0>; -+ dcic_mux = "dcic-hdmi"; -+ status = "okay"; -+}; -+ -+&dcic2 { -+ dcic_id = <1>; -+ dcic_mux = "dcic-lvds1"; -+ status = "okay"; -+}; -diff -Nur linux-4.1.3/arch/arm/boot/dts/imx6qdl-microsom.dtsi linux-xbian-imx6/arch/arm/boot/dts/imx6qdl-microsom.dtsi ---- linux-4.1.3/arch/arm/boot/dts/imx6qdl-microsom.dtsi 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/arch/arm/boot/dts/imx6qdl-microsom.dtsi 2015-07-27 23:13:00.303898027 +0200 -@@ -39,15 +39,98 @@ - * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR - * OTHER DEALINGS IN THE SOFTWARE. 
- */ -+#include -+/ { -+ clk_sdio: sdio-clock { -+ compatible = "gpio-gate-clock"; -+ #clock-cells = <0>; -+ pinctrl-names = "default"; -+ pinctrl-0 = <&pinctrl_microsom_brcm_osc>; -+ enable-gpios = <&gpio5 5 GPIO_ACTIVE_HIGH>; -+ }; -+ -+ regulators { -+ compatible = "simple-bus"; -+ -+ reg_brcm: brcm-reg { -+ compatible = "regulator-fixed"; -+ enable-active-high; -+ gpio = <&gpio3 19 0>; -+ pinctrl-names = "default"; -+ pinctrl-0 = <&pinctrl_microsom_brcm_reg>; -+ regulator-name = "brcm_reg"; -+ regulator-min-microvolt = <3300000>; -+ regulator-max-microvolt = <3300000>; -+ startup-delay-us = <200000>; -+ }; -+ }; -+ -+ usdhc1_pwrseq: usdhc1_pwrseq { -+ compatible = "mmc-pwrseq-simple"; -+ reset-gpios = <&gpio5 26 GPIO_ACTIVE_LOW>, -+ <&gpio6 0 GPIO_ACTIVE_LOW>; -+ clocks = <&clk_sdio>; -+ clock-names = "ext_clock"; -+ }; -+}; - - &iomuxc { - microsom { -+ pinctrl_microsom_brcm_bt: microsom-brcm-bt { -+ fsl,pins = < -+ MX6QDL_PAD_CSI0_DAT14__GPIO6_IO00 0x40013070 -+ MX6QDL_PAD_CSI0_DAT15__GPIO6_IO01 0x40013070 -+ MX6QDL_PAD_CSI0_DAT18__GPIO6_IO04 0x40013070 -+ >; -+ }; -+ -+ pinctrl_microsom_brcm_osc: microsom-brcm-osc { -+ fsl,pins = < -+ MX6QDL_PAD_DISP0_DAT11__GPIO5_IO05 0x40013070 -+ >; -+ }; -+ -+ pinctrl_microsom_brcm_reg: microsom-brcm-reg { -+ fsl,pins = < -+ MX6QDL_PAD_EIM_D19__GPIO3_IO19 0x40013070 -+ >; -+ }; -+ -+ pinctrl_microsom_brcm_wifi: microsom-brcm-wifi { -+ fsl,pins = < -+ MX6QDL_PAD_GPIO_8__XTALOSC_REF_CLK_32K 0x1b0b0 -+ MX6QDL_PAD_CSI0_DATA_EN__GPIO5_IO20 0x40013070 -+ MX6QDL_PAD_CSI0_DAT8__GPIO5_IO26 0x40013070 -+ MX6QDL_PAD_CSI0_DAT9__GPIO5_IO27 0x40013070 -+ >; -+ }; -+ - pinctrl_microsom_uart1: microsom-uart1 { - fsl,pins = < - MX6QDL_PAD_CSI0_DAT10__UART1_TX_DATA 0x1b0b1 - MX6QDL_PAD_CSI0_DAT11__UART1_RX_DATA 0x1b0b1 - >; - }; -+ -+ pinctrl_microsom_uart4: microsom-uart4 { -+ fsl,pins = < -+ MX6QDL_PAD_CSI0_DAT12__UART4_TX_DATA 0x1b0b1 -+ MX6QDL_PAD_CSI0_DAT13__UART4_RX_DATA 0x1b0b1 -+ MX6QDL_PAD_CSI0_DAT16__UART4_RTS_B 0x1b0b1 -+ MX6QDL_PAD_CSI0_DAT17__UART4_CTS_B 0x1b0b1 -+ >; -+ }; -+ -+ pinctrl_microsom_usdhc1: microsom-usdhc1 { -+ fsl,pins = < -+ MX6QDL_PAD_SD1_CMD__SD1_CMD 0x17059 -+ MX6QDL_PAD_SD1_CLK__SD1_CLK 0x10059 -+ MX6QDL_PAD_SD1_DAT0__SD1_DATA0 0x17059 -+ MX6QDL_PAD_SD1_DAT1__SD1_DATA1 0x17059 -+ MX6QDL_PAD_SD1_DAT2__SD1_DATA2 0x17059 -+ MX6QDL_PAD_SD1_DAT3__SD1_DATA3 0x17059 -+ >; -+ }; - }; - }; - -@@ -56,3 +139,23 @@ - pinctrl-0 = <&pinctrl_microsom_uart1>; - status = "okay"; - }; -+ -+/* UART4 - Connected to optional BRCM Wifi/BT/FM */ -+&uart4 { -+ pinctrl-names = "default"; -+ pinctrl-0 = <&pinctrl_microsom_brcm_bt &pinctrl_microsom_uart4>; -+ fsl,uart-has-rtscts; -+ status = "okay"; -+}; -+ -+/* USDHC1 - Connected to optional BRCM Wifi/BT/FM */ -+&usdhc1 { -+ pinctrl-names = "default"; -+ pinctrl-0 = <&pinctrl_microsom_brcm_wifi &pinctrl_microsom_usdhc1>; -+ bus-width = <4>; -+ mmc-pwrseq = <&usdhc1_pwrseq>; -+ keep-power-in-suspend; -+ non-removable; -+ vmmc-supply = <®_brcm>; -+ status = "okay"; -+}; -diff -Nur linux-4.1.3/arch/arm/boot/dts/imx6q.dtsi linux-xbian-imx6/arch/arm/boot/dts/imx6q.dtsi ---- linux-4.1.3/arch/arm/boot/dts/imx6q.dtsi 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/arch/arm/boot/dts/imx6q.dtsi 2015-07-27 23:13:00.303898027 +0200 -@@ -14,6 +14,7 @@ - - / { - aliases { -+ ipu1 = &ipu2; - spi4 = &ecspi5; - }; - -@@ -47,9 +48,12 @@ - <&clks IMX6QDL_CLK_PLL2_PFD2_396M>, - <&clks IMX6QDL_CLK_STEP>, - <&clks IMX6QDL_CLK_PLL1_SW>, -- <&clks IMX6QDL_CLK_PLL1_SYS>; -+ <&clks IMX6QDL_CLK_PLL1_SYS>, -+ <&clks 
IMX6QDL_PLL1_BYPASS>, -+ <&clks IMX6QDL_CLK_PLL1>, -+ <&clks IMX6QDL_PLL1_BYPASS_SRC> ; - clock-names = "arm", "pll2_pfd2_396m", "step", -- "pll1_sw", "pll1_sys"; -+ "pll1_sw", "pll1_sys", "pll1_bypass", "pll1", "pll1_bypass_src"; - arm-supply = <®_arm>; - pu-supply = <®_pu>; - soc-supply = <®_soc>; -@@ -78,9 +82,85 @@ - }; - - soc { -- ocram: sram@00900000 { -+ -+ busfreq { /* BUSFREQ */ -+ compatible = "fsl,imx6_busfreq"; -+ clocks = <&clks 171>, <&clks 6>, <&clks 11>, <&clks 104>, <&clks 172>, <&clks 58>, -+ <&clks 18>, <&clks 60>, <&clks 20>, <&clks 3>; -+ clock-names = "pll2_bus", "pll2_pfd2_396m", "pll2_198m", "arm", "pll3_usb_otg", "periph", -+ "periph_pre", "periph_clk2", "periph_clk2_sel", "osc"; -+ interrupts = <0 107 0x04>, <0 112 0x4>, <0 113 0x4>, <0 114 0x4>; -+ interrupt-names = "irq_busfreq_0", "irq_busfreq_1", "irq_busfreq_2", "irq_busfreq_3"; -+ fsl,max_ddr_freq = <528000000>; -+ }; -+ -+ gpu@00130000 { -+ compatible = "fsl,imx6q-gpu"; -+ reg = <0x00130000 0x4000>, <0x00134000 0x4000>, -+ <0x02204000 0x4000>, <0x0 0x0>; -+ reg-names = "iobase_3d", "iobase_2d", -+ "iobase_vg", "phys_baseaddr"; -+ interrupts = <0 9 0x04>, <0 10 0x04>,<0 11 0x04>; -+ interrupt-names = "irq_3d", "irq_2d", "irq_vg"; -+ clocks = <&clks 26>, <&clks 143>, -+ <&clks 27>, <&clks 121>, -+ <&clks 122>, <&clks 74>; -+ clock-names = "gpu2d_axi_clk", "openvg_axi_clk", -+ "gpu3d_axi_clk", "gpu2d_clk", -+ "gpu3d_clk", "gpu3d_shader_clk"; -+ resets = <&src 0>, <&src 3>, <&src 3>; -+ reset-names = "gpu3d", "gpu2d", "gpuvg"; -+ power-domains = <&gpc 1>; -+ }; -+ -+ hdmi_core: hdmi_core@00120000 { -+ compatible = "fsl,imx6q-hdmi-core"; -+ reg = <0x00120000 0x9000>; -+ clocks = <&clks 124>, <&clks 123>; -+ clock-names = "hdmi_isfr", "hdmi_iahb"; -+ status = "disabled"; -+ }; -+ -+ hdmi_video: hdmi_video@020e0000 { -+ compatible = "fsl,imx6q-hdmi-video"; -+ reg = <0x020e0000 0x1000>; -+ reg-names = "hdmi_gpr"; -+ interrupts = <0 115 0x04>; -+ clocks = <&clks 124>, <&clks 123>; -+ clock-names = "hdmi_isfr", "hdmi_iahb"; -+ status = "disabled"; -+ }; -+ -+ hdmi_audio: hdmi_audio@00120000 { -+ compatible = "fsl,imx6q-hdmi-audio"; -+ clocks = <&clks 124>, <&clks 123>; -+ clock-names = "hdmi_isfr", "hdmi_iahb"; -+ dmas = <&sdma 2 23 0>; -+ dma-names = "tx"; -+ status = "disabled"; -+ }; -+ -+ hdmi_cec: hdmi_cec@00120000 { -+ compatible = "fsl,imx6q-hdmi-cec"; -+ interrupts = <0 115 0x04>; -+ status = "disabled"; -+ }; -+ -+ ocrams: sram@00900000 { -+ compatible = "fsl,lpm-sram"; -+ reg = <0x00900000 0x4000>; -+ clocks = <&clks IMX6QDL_CLK_OCRAM>; -+ }; -+ -+ ocrams_ddr: sram@00904000 { -+ compatible = "fsl,ddr-lpm-sram"; -+ reg = <0x00904000 0x1000>; -+ clocks = <&clks IMX6QDL_CLK_OCRAM>; -+ }; -+ -+ ocram: sram@00905000 { - compatible = "mmio-sram"; -- reg = <0x00900000 0x40000>; -+ reg = <0x00905000 0x3B000>; - clocks = <&clks IMX6QDL_CLK_OCRAM>; - }; - -@@ -101,6 +181,10 @@ - }; - }; - -+ vpu@02040000 { -+ status = "okay"; -+ }; -+ - iomuxc: iomuxc@020e0000 { - compatible = "fsl,imx6q-iomuxc"; - -@@ -154,165 +238,33 @@ - }; - - ipu2: ipu@02800000 { -- #address-cells = <1>; -- #size-cells = <0>; - compatible = "fsl,imx6q-ipu"; - reg = <0x02800000 0x400000>; - interrupts = <0 8 IRQ_TYPE_LEVEL_HIGH>, - <0 7 IRQ_TYPE_LEVEL_HIGH>; -- clocks = <&clks IMX6QDL_CLK_IPU2>, -- <&clks IMX6QDL_CLK_IPU2_DI0>, -- <&clks IMX6QDL_CLK_IPU2_DI1>; -- clock-names = "bus", "di0", "di1"; -+ clocks = <&clks 133>, <&clks 134>, <&clks 137>, -+ <&clks 41>, <&clks 42>, -+ <&clks 135>, <&clks 136>; -+ clock-names = "bus", "di0", "di1", -+ 
"di0_sel", "di1_sel", -+ "ldb_di0", "ldb_di1"; - resets = <&src 4>; -- -- ipu2_csi0: port@0 { -- reg = <0>; -- }; -- -- ipu2_csi1: port@1 { -- reg = <1>; -- }; -- -- ipu2_di0: port@2 { -- #address-cells = <1>; -- #size-cells = <0>; -- reg = <2>; -- -- ipu2_di0_disp0: endpoint@0 { -- }; -- -- ipu2_di0_hdmi: endpoint@1 { -- remote-endpoint = <&hdmi_mux_2>; -- }; -- -- ipu2_di0_mipi: endpoint@2 { -- }; -- -- ipu2_di0_lvds0: endpoint@3 { -- remote-endpoint = <&lvds0_mux_2>; -- }; -- -- ipu2_di0_lvds1: endpoint@4 { -- remote-endpoint = <&lvds1_mux_2>; -- }; -- }; -- -- ipu2_di1: port@3 { -- #address-cells = <1>; -- #size-cells = <0>; -- reg = <3>; -- -- ipu2_di1_hdmi: endpoint@1 { -- remote-endpoint = <&hdmi_mux_3>; -- }; -- -- ipu2_di1_mipi: endpoint@2 { -- }; -- -- ipu2_di1_lvds0: endpoint@3 { -- remote-endpoint = <&lvds0_mux_3>; -- }; -- -- ipu2_di1_lvds1: endpoint@4 { -- remote-endpoint = <&lvds1_mux_3>; -- }; -- }; -- }; -- }; -- -- display-subsystem { -- compatible = "fsl,imx-display-subsystem"; -- ports = <&ipu1_di0>, <&ipu1_di1>, <&ipu2_di0>, <&ipu2_di1>; -- }; --}; -- --&hdmi { -- compatible = "fsl,imx6q-hdmi"; -- -- port@2 { -- reg = <2>; -- -- hdmi_mux_2: endpoint { -- remote-endpoint = <&ipu2_di0_hdmi>; -- }; -- }; -- -- port@3 { -- reg = <3>; -- -- hdmi_mux_3: endpoint { -- remote-endpoint = <&ipu2_di1_hdmi>; -+ bypass_reset = <0>; - }; - }; - }; - - &ldb { -- clocks = <&clks IMX6QDL_CLK_LDB_DI0_SEL>, <&clks IMX6QDL_CLK_LDB_DI1_SEL>, -+ clocks = <&clks IMX6QDL_CLK_LDB_DI0>, <&clks IMX6QDL_CLK_LDB_DI1>, - <&clks IMX6QDL_CLK_IPU1_DI0_SEL>, <&clks IMX6QDL_CLK_IPU1_DI1_SEL>, - <&clks IMX6QDL_CLK_IPU2_DI0_SEL>, <&clks IMX6QDL_CLK_IPU2_DI1_SEL>, -- <&clks IMX6QDL_CLK_LDB_DI0>, <&clks IMX6QDL_CLK_LDB_DI1>; -- clock-names = "di0_pll", "di1_pll", -- "di0_sel", "di1_sel", "di2_sel", "di3_sel", -- "di0", "di1"; -- -- lvds-channel@0 { -- port@2 { -- reg = <2>; -- -- lvds0_mux_2: endpoint { -- remote-endpoint = <&ipu2_di0_lvds0>; -- }; -- }; -- -- port@3 { -- reg = <3>; -- -- lvds0_mux_3: endpoint { -- remote-endpoint = <&ipu2_di1_lvds0>; -- }; -- }; -- }; -- -- lvds-channel@1 { -- port@2 { -- reg = <2>; -- -- lvds1_mux_2: endpoint { -- remote-endpoint = <&ipu2_di0_lvds1>; -- }; -- }; -- -- port@3 { -- reg = <3>; -- -- lvds1_mux_3: endpoint { -- remote-endpoint = <&ipu2_di1_lvds1>; -- }; -- }; -- }; --}; -- --&mipi_dsi { -- ports { -- port@2 { -- reg = <2>; -- -- mipi_mux_2: endpoint { -- remote-endpoint = <&ipu2_di0_mipi>; -- }; -- }; -- -- port@3 { -- reg = <3>; -- -- mipi_mux_3: endpoint { -- remote-endpoint = <&ipu2_di1_mipi>; -- }; -- }; -- }; --}; -- --&vpu { -- compatible = "fsl,imx6q-vpu", "cnm,coda960"; -+ <&clks IMX6QDL_CLK_LDB_DI0_DIV_3_5>, <&clks IMX6QDL_CLK_LDB_DI1_DIV_3_5>, -+ <&clks IMX6QDL_CLK_LDB_DI0_DIV_7>, <&clks IMX6QDL_CLK_LDB_DI1_DIV_7>, -+ <&clks IMX6QDL_CLK_LDB_DI0_DIV_SEL>, <&clks IMX6QDL_CLK_LDB_DI1_DIV_SEL>; -+ clock-names = "ldb_di0", "ldb_di1", -+ "di0_sel", "di1_sel", -+ "di2_sel", "di3_sel", -+ "ldb_di0_div_3_5", "ldb_di1_div_3_5", -+ "ldb_di0_div_7", "ldb_di1_div_7", -+ "ldb_di0_div_sel", "ldb_di1_div_sel"; - }; -diff -Nur linux-4.1.3/arch/arm/boot/dts/imx6q-hummingboard.dts linux-xbian-imx6/arch/arm/boot/dts/imx6q-hummingboard.dts ---- linux-4.1.3/arch/arm/boot/dts/imx6q-hummingboard.dts 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/arch/arm/boot/dts/imx6q-hummingboard.dts 2015-07-27 23:13:00.303898027 +0200 -@@ -57,3 +57,7 @@ - fsl,transmit-atten-16ths = <9>; - fsl,receive-eq-mdB = <3000>; - }; -+ -+&sgtl5000 { -+ status = "okay"; -+}; -diff -Nur 
linux-4.1.3/arch/arm/boot/dts/imx6sl.dtsi linux-xbian-imx6/arch/arm/boot/dts/imx6sl.dtsi ---- linux-4.1.3/arch/arm/boot/dts/imx6sl.dtsi 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/arch/arm/boot/dts/imx6sl.dtsi 2015-07-27 23:13:00.307883804 +0200 -@@ -457,20 +457,21 @@ - anatop-min-bit-val = <4>; - anatop-min-voltage = <800000>; - anatop-max-voltage = <1375000>; -+ anatop-enable-bit = <0>; - }; - -- regulator-3p0@120 { -+ reg_3p0: regulator-3p0@120 { - compatible = "fsl,anatop-regulator"; - regulator-name = "vdd3p0"; -- regulator-min-microvolt = <2800000>; -- regulator-max-microvolt = <3150000>; -- regulator-always-on; -+ regulator-min-microvolt = <2625000>; -+ regulator-max-microvolt = <3400000>; - anatop-reg-offset = <0x120>; - anatop-vol-bit-shift = <8>; - anatop-vol-bit-width = <5>; - anatop-min-bit-val = <0>; - anatop-min-voltage = <2625000>; - anatop-max-voltage = <3400000>; -+ anatop-enable-bit = <0>; - }; - - regulator-2p5@130 { -@@ -485,6 +486,7 @@ - anatop-min-bit-val = <0>; - anatop-min-voltage = <2100000>; - anatop-max-voltage = <2850000>; -+ anatop-enable-bit = <0>; - }; - - reg_arm: regulator-vddcore@140 { -@@ -552,6 +554,7 @@ - reg = <0x020c9000 0x1000>; - interrupts = <0 44 IRQ_TYPE_LEVEL_HIGH>; - clocks = <&clks IMX6SL_CLK_USBPHY1>; -+ phy-3p0-supply = <®_3p0>; - fsl,anatop = <&anatop>; - }; - -@@ -560,6 +563,7 @@ - reg = <0x020ca000 0x1000>; - interrupts = <0 45 IRQ_TYPE_LEVEL_HIGH>; - clocks = <&clks IMX6SL_CLK_USBPHY2>; -+ phy-3p0-supply = <®_3p0>; - fsl,anatop = <&anatop>; - }; - -diff -Nur linux-4.1.3/arch/arm/boot/dts/imx6sx.dtsi linux-xbian-imx6/arch/arm/boot/dts/imx6sx.dtsi ---- linux-4.1.3/arch/arm/boot/dts/imx6sx.dtsi 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/arch/arm/boot/dts/imx6sx.dtsi 2015-07-27 23:13:00.307883804 +0200 -@@ -556,20 +556,21 @@ - anatop-min-bit-val = <4>; - anatop-min-voltage = <800000>; - anatop-max-voltage = <1375000>; -+ anatop-enable-bit = <0>; - }; - -- regulator-3p0@120 { -+ reg_3p0: regulator-3p0@120 { - compatible = "fsl,anatop-regulator"; - regulator-name = "vdd3p0"; -- regulator-min-microvolt = <2800000>; -- regulator-max-microvolt = <3150000>; -- regulator-always-on; -+ regulator-min-microvolt = <2625000>; -+ regulator-max-microvolt = <3400000>; - anatop-reg-offset = <0x120>; - anatop-vol-bit-shift = <8>; - anatop-vol-bit-width = <5>; - anatop-min-bit-val = <0>; - anatop-min-voltage = <2625000>; - anatop-max-voltage = <3400000>; -+ anatop-enable-bit = <0>; - }; - - regulator-2p5@130 { -@@ -584,6 +585,7 @@ - anatop-min-bit-val = <0>; - anatop-min-voltage = <2100000>; - anatop-max-voltage = <2875000>; -+ anatop-enable-bit = <0>; - }; - - reg_arm: regulator-vddcore@140 { -@@ -650,6 +652,7 @@ - reg = <0x020c9000 0x1000>; - interrupts = ; - clocks = <&clks IMX6SX_CLK_USBPHY1>; -+ phy-3p0-supply = <®_3p0>; - fsl,anatop = <&anatop>; - }; - -@@ -658,6 +661,7 @@ - reg = <0x020ca000 0x1000>; - interrupts = ; - clocks = <&clks IMX6SX_CLK_USBPHY2>; -+ phy-3p0-supply = <®_3p0>; - fsl,anatop = <&anatop>; - }; - -diff -Nur linux-4.1.3/arch/arm/include/asm/glue-cache.h linux-xbian-imx6/arch/arm/include/asm/glue-cache.h ---- linux-4.1.3/arch/arm/include/asm/glue-cache.h 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/arch/arm/include/asm/glue-cache.h 2015-07-27 23:13:00.746319518 +0200 -@@ -102,19 +102,19 @@ - #endif - - #if defined(CONFIG_CPU_V6) || defined(CONFIG_CPU_V6K) --# ifdef _CACHE -+//# ifdef _CACHE - # define MULTI_CACHE 1 --# else --# define _CACHE v6 --# endif -+//# else -+//# define _CACHE v6 -+//# 
endif - #endif - - #if defined(CONFIG_CPU_V7) --# ifdef _CACHE -+//# ifdef _CACHE - # define MULTI_CACHE 1 --# else --# define _CACHE v7 --# endif -+//# else -+//# define _CACHE v7 -+//# endif - #endif - - #if defined(CONFIG_CPU_V7M) -diff -Nur linux-4.1.3/arch/arm/Kconfig linux-xbian-imx6/arch/arm/Kconfig ---- linux-4.1.3/arch/arm/Kconfig 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/arch/arm/Kconfig 2015-07-27 23:13:00.128523741 +0200 -@@ -1688,6 +1688,7 @@ - range 11 64 if ARCH_SHMOBILE_LEGACY - default "12" if SOC_AM33XX - default "9" if SA1111 || ARCH_EFM32 -+ default "14" if ARCH_MXC - default "11" - help - The kernel memory allocator divides physically contiguous memory -diff -Nur linux-4.1.3/arch/arm/mach-imx/busfreq_ddr3.c linux-xbian-imx6/arch/arm/mach-imx/busfreq_ddr3.c ---- linux-4.1.3/arch/arm/mach-imx/busfreq_ddr3.c 1970-01-01 01:00:00.000000000 +0100 -+++ linux-xbian-imx6/arch/arm/mach-imx/busfreq_ddr3.c 2015-07-27 23:13:01.073153409 +0200 -@@ -0,0 +1,514 @@ -+/* -+ * Copyright (C) 2011-2013 Freescale Semiconductor, Inc. All Rights Reserved. -+ */ -+ -+/* -+ * The code contained herein is licensed under the GNU General Public -+ * License. You may obtain a copy of the GNU General Public License -+ * Version 2 or later at the following locations: -+ * -+ * http://www.opensource.org/licenses/gpl-license.html -+ * http://www.gnu.org/copyleft/gpl.html -+ */ -+ -+/*! -+ * @file busfreq_ddr3.c -+ * -+ * @brief iMX6 DDR3 frequency change specific file. -+ * -+ * @ingroup PM -+ */ -+#define DEBUG -+ -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+ -+#include "hardware.h" -+ -+/* DDR settings */ -+static unsigned long (*iram_ddr_settings)[2]; -+static unsigned long (*normal_mmdc_settings)[2]; -+static unsigned long (*iram_iomux_settings)[2]; -+static void __iomem *mmdc_base; -+static void __iomem *iomux_base; -+static void __iomem *ccm_base; -+static void __iomem *l2_base; -+static void __iomem *gic_dist_base; -+static u32 *irqs_used; -+ -+static void *ddr_freq_change_iram_base; -+static int ddr_settings_size; -+static int iomux_settings_size; -+static volatile unsigned int cpus_in_wfe; -+static volatile bool wait_for_ddr_freq_update; -+static int curr_ddr_rate; -+ -+void (*mx6_change_ddr_freq)(u32 freq, void *ddr_settings, -+ bool dll_mode, void *iomux_offsets) = NULL; -+ -+extern unsigned int ddr_med_rate; -+extern unsigned int ddr_normal_rate; -+extern int low_bus_freq_mode; -+extern int audio_bus_freq_mode; -+extern void mx6_ddr3_freq_change(u32 freq, void *ddr_settings, -+ bool dll_mode, void *iomux_offsets); -+extern unsigned long save_ttbr1(void); -+extern void restore_ttbr1(unsigned long ttbr1); -+ -+#ifdef CONFIG_SMP -+extern void __iomem *imx_scu_base; -+static unsigned int online_cpus; -+#endif -+ -+#define MIN_DLL_ON_FREQ 333000000 -+#define MAX_DLL_OFF_FREQ 125000000 -+#define DDR_FREQ_CHANGE_SIZE 0x2000 -+ -+unsigned long ddr3_dll_mx6q[][2] = { -+ {0x0c, 0x0}, -+ {0x10, 0x0}, -+ {0x1C, 0x04088032}, -+ {0x1C, 0x0408803a}, -+ {0x1C, 0x08408030}, -+ {0x1C, 0x08408038}, -+ {0x818, 0x0}, -+}; -+ -+unsigned long ddr3_calibration[][2] = { -+ {0x83c, 0x0}, -+ {0x840, 0x0}, -+ {0x483c, 0x0}, -+ {0x4840, 0x0}, -+ {0x848, 0x0}, -+ {0x4848, 0x0}, -+ {0x850, 0x0}, -+ {0x4850, 0x0}, -+}; -+ -+unsigned long ddr3_dll_mx6dl[][2] = { -+ {0x0c, 0x0}, -+ {0x10, 0x0}, -+ {0x1C, 
0x04008032}, -+ {0x1C, 0x0400803a}, -+ {0x1C, 0x07208030}, -+ {0x1C, 0x07208038}, -+ {0x818, 0x0}, -+}; -+ -+unsigned long iomux_offsets_mx6q[][2] = { -+ {0x5A8, 0x0}, -+ {0x5B0, 0x0}, -+ {0x524, 0x0}, -+ {0x51C, 0x0}, -+ {0x518, 0x0}, -+ {0x50C, 0x0}, -+ {0x5B8, 0x0}, -+ {0x5C0, 0x0}, -+}; -+ -+unsigned long iomux_offsets_mx6dl[][2] = { -+ {0x4BC, 0x0}, -+ {0x4C0, 0x0}, -+ {0x4C4, 0x0}, -+ {0x4C8, 0x0}, -+ {0x4CC, 0x0}, -+ {0x4D0, 0x0}, -+ {0x4D4, 0x0}, -+ {0x4D8, 0x0}, -+}; -+ -+unsigned long ddr3_400[][2] = { -+ {0x83c, 0x42490249}, -+ {0x840, 0x02470247}, -+ {0x483c, 0x42570257}, -+ {0x4840, 0x02400240}, -+ {0x848, 0x4039363C}, -+ {0x4848, 0x3A39333F}, -+ {0x850, 0x38414441}, -+ {0x4850, 0x472D4833} -+}; -+ -+int can_change_ddr_freq(void) -+{ -+ return 0; -+} -+ -+/* -+ * each active core apart from the one changing -+ * the DDR frequency will execute this function. -+ * the rest of the cores have to remain in WFE -+ * state until the frequency is changed. -+ */ -+irqreturn_t wait_in_wfe_irq(int irq, void *dev_id) -+{ -+ u32 me = smp_processor_id(); -+ -+ *((char *)(&cpus_in_wfe) + (u8)me) = 0xff; -+ -+ while (wait_for_ddr_freq_update) -+ wfe(); -+ -+ *((char *)(&cpus_in_wfe) + (u8)me) = 0; -+ -+ return IRQ_HANDLED; -+} -+ -+/* change the DDR frequency. */ -+int update_ddr_freq(int ddr_rate) -+{ -+ int i, j; -+ bool dll_off = false; -+ int me = 0; -+ unsigned long ttbr1; -+#ifdef CONFIG_SMP -+ unsigned int reg; -+ int cpu = 0; -+#endif -+ -+ if (!can_change_ddr_freq()) -+ return -1; -+ -+ if (ddr_rate == curr_ddr_rate) -+ return 0; -+ -+ printk(KERN_DEBUG "\nBus freq set to %d start...\n", ddr_rate); -+ -+ if (low_bus_freq_mode || audio_bus_freq_mode) -+ dll_off = true; -+ -+ iram_ddr_settings[0][0] = ddr_settings_size; -+ iram_iomux_settings[0][0] = iomux_settings_size; -+ if (ddr_rate == ddr_med_rate && cpu_is_imx6q() && -+ ddr_med_rate != ddr_normal_rate) { -+ for (i = 0; i < ARRAY_SIZE(ddr3_dll_mx6q); i++) { -+ iram_ddr_settings[i + 1][0] = -+ normal_mmdc_settings[i][0]; -+ iram_ddr_settings[i + 1][1] = -+ normal_mmdc_settings[i][1]; -+ } -+ for (j = 0, i = ARRAY_SIZE(ddr3_dll_mx6q); -+ i < iram_ddr_settings[0][0]; j++, i++) { -+ iram_ddr_settings[i + 1][0] = -+ ddr3_400[j][0]; -+ iram_ddr_settings[i + 1][1] = -+ ddr3_400[j][1]; -+ } -+ } else if (ddr_rate == ddr_normal_rate) { -+ for (i = 0; i < iram_ddr_settings[0][0]; i++) { -+ iram_ddr_settings[i + 1][0] = -+ normal_mmdc_settings[i][0]; -+ iram_ddr_settings[i + 1][1] = -+ normal_mmdc_settings[i][1]; -+ } -+ } -+ -+ /* ensure that all Cores are in WFE. */ -+ local_irq_disable(); -+ -+#ifdef CONFIG_SMP -+ me = smp_processor_id(); -+ -+ /* Make sure all the online cores are active */ -+ while (1) { -+ bool not_exited_busfreq = false; -+ for_each_online_cpu(cpu) { -+ u32 reg = __raw_readl(imx_scu_base + 0x08); -+ if (reg & (0x02 << (cpu * 8))) -+ not_exited_busfreq = true; -+ } -+ if (!not_exited_busfreq) -+ break; -+ } -+ -+ wmb(); -+ wait_for_ddr_freq_update = 1; -+ dsb(); -+ -+ online_cpus = readl_relaxed(imx_scu_base + 0x08); -+ for_each_online_cpu(cpu) { -+ *((char *)(&online_cpus) + (u8)cpu) = 0x02; -+ if (cpu != me) { -+ /* set the interrupt to be pending in the GIC. 
*/ -+ reg = 1 << (irqs_used[cpu] % 32); -+ writel_relaxed(reg, gic_dist_base + GIC_DIST_PENDING_SET -+ + (irqs_used[cpu] / 32) * 4); -+ } -+ } -+ /* Wait for the other active CPUs to idle */ -+ while (1) { -+ u32 reg = readl_relaxed(imx_scu_base + 0x08); -+ reg |= (0x02 << (me * 8)); -+ if (reg == online_cpus) -+ break; -+ } -+#endif -+ -+ /* Ensure iram_tlb_phys_addr is flushed to DDR. */ -+ /*__cpuc_flush_dcache_area(&iram_tlb_phys_addr, sizeof(iram_tlb_phys_addr)); -+ outer_clean_range(virt_to_phys(&iram_tlb_phys_addr), virt_to_phys(&iram_tlb_phys_addr + 1));*/ -+ -+ /* -+ * Flush the TLB, to ensure no TLB maintenance occurs -+ * when DDR is in self-refresh. -+ */ -+ local_flush_tlb_all(); -+ -+ ttbr1 = save_ttbr1(); -+ /* Now we can change the DDR frequency. */ -+ mx6_change_ddr_freq(ddr_rate, iram_ddr_settings, -+ dll_off, iram_iomux_settings); -+ restore_ttbr1(ttbr1); -+ curr_ddr_rate = ddr_rate; -+ -+#ifdef CONFIG_SMP -+ wmb(); -+ /* DDR frequency change is done . */ -+ wait_for_ddr_freq_update = 0; -+ dsb(); -+ -+ /* wake up all the cores. */ -+ sev(); -+#endif -+ -+ local_irq_enable(); -+ -+ printk(KERN_DEBUG "Bus freq set to %d done! cpu=%d\n", ddr_rate, me); -+ -+ return 0; -+} -+ -+int init_mmdc_ddr3_settings(struct platform_device *busfreq_pdev) -+{ -+ struct device *dev = &busfreq_pdev->dev; -+ struct platform_device *ocram_dev; -+ unsigned int iram_paddr; -+ int i, err; -+ u32 cpu; -+ struct device_node *node; -+ struct gen_pool *iram_pool; -+ -+ node = of_find_compatible_node(NULL, NULL, "fsl,imx6q-mmdc-combine"); -+ if (!node) { -+ pr_err("failed to find imx6q-mmdc device tree data!\n"); -+ return -EINVAL; -+ } -+ mmdc_base = of_iomap(node, 0); -+ WARN(!mmdc_base, "unable to map mmdc registers\n"); -+ -+ node = NULL; -+ if (cpu_is_imx6q()) -+ node = of_find_compatible_node(NULL, NULL, "fsl,imx6q-iomuxc"); -+ if (cpu_is_imx6dl()) -+ node = of_find_compatible_node(NULL, NULL, -+ "fsl,imx6dl-iomuxc"); -+ if (!node) { -+ pr_err("failed to find imx6q-iomux device tree data!\n"); -+ return -EINVAL; -+ } -+ iomux_base = of_iomap(node, 0); -+ WARN(!iomux_base, "unable to map iomux registers\n"); -+ -+ node = of_find_compatible_node(NULL, NULL, "fsl,imx6q-ccm"); -+ if (!node) { -+ pr_err("failed to find imx6q-ccm device tree data!\n"); -+ return -EINVAL; -+ } -+ ccm_base = of_iomap(node, 0); -+ WARN(!ccm_base, "unable to map mmdc registers\n"); -+ -+ node = of_find_compatible_node(NULL, NULL, "arm,pl310-cache"); -+ if (!node) { -+ pr_err("failed to find imx6q-pl310-cache device tree data!\n"); -+ return -EINVAL; -+ } -+ l2_base = of_iomap(node, 0); -+ WARN(!ccm_base, "unable to map mmdc registers\n"); -+ -+ node = NULL; -+ node = of_find_compatible_node(NULL, NULL, "arm,cortex-a9-gic"); -+ if (!node) { -+ pr_err("failed to find imx6q-a9-gic device tree data!\n"); -+ return -EINVAL; -+ } -+ gic_dist_base = of_iomap(node, 0); -+ WARN(!gic_dist_base, "unable to map gic dist registers\n"); -+ -+ if (cpu_is_imx6q()) -+ ddr_settings_size = ARRAY_SIZE(ddr3_dll_mx6q) + -+ ARRAY_SIZE(ddr3_calibration); -+ if (cpu_is_imx6dl()) -+ ddr_settings_size = ARRAY_SIZE(ddr3_dll_mx6dl) + -+ ARRAY_SIZE(ddr3_calibration); -+ -+ normal_mmdc_settings = kmalloc((ddr_settings_size * 8), GFP_KERNEL); -+ if (cpu_is_imx6q()) { -+ memcpy(normal_mmdc_settings, ddr3_dll_mx6q, -+ sizeof(ddr3_dll_mx6q)); -+ memcpy(((char *)normal_mmdc_settings + sizeof(ddr3_dll_mx6q)), -+ ddr3_calibration, sizeof(ddr3_calibration)); -+ } -+ if (cpu_is_imx6dl()) { -+ memcpy(normal_mmdc_settings, ddr3_dll_mx6dl, -+ 
sizeof(ddr3_dll_mx6dl)); -+ memcpy(((char *)normal_mmdc_settings + sizeof(ddr3_dll_mx6dl)), -+ ddr3_calibration, sizeof(ddr3_calibration)); -+ } -+ /* store the original DDR settings at boot. */ -+ for (i = 0; i < ddr_settings_size; i++) { -+ /* -+ * writes via command mode register cannot be read back. -+ * hence hardcode them in the initial static array. -+ * this may require modification on a per customer basis. -+ */ -+ if (normal_mmdc_settings[i][0] != 0x1C) -+ normal_mmdc_settings[i][1] = -+ readl_relaxed(mmdc_base -+ + normal_mmdc_settings[i][0]); -+ } -+ -+ irqs_used = devm_kzalloc(dev, sizeof(u32) * num_present_cpus(), -+ GFP_KERNEL); -+ -+ for_each_online_cpu(cpu) { -+ int irq; -+ -+ /* -+ * set up a reserved interrupt to get all -+ * the active cores into a WFE state -+ * before changing the DDR frequency. -+ */ -+ irq = platform_get_irq(busfreq_pdev, cpu); -+ err = request_irq(irq, wait_in_wfe_irq, -+ IRQF_PERCPU, "mmdc_1", NULL); -+ if (err) { -+ dev_err(dev, -+ "Busfreq:request_irq failed %d, err = %d\n", -+ irq, err); -+ return err; -+ } -+ err = irq_set_affinity(irq, cpumask_of(cpu)); -+ if (err) { -+ dev_err(dev, -+ "Busfreq: Cannot set irq affinity irq=%d,\n", -+ irq); -+ return err; -+ } -+ irqs_used[cpu] = irq; -+ } -+ -+ node = NULL; -+ node = of_find_compatible_node(NULL, NULL, "mmio-sram"); -+ if (!node) { -+ dev_err(dev, "%s: failed to find ocram node\n", -+ __func__); -+ return -EINVAL; -+ } -+ -+ ocram_dev = of_find_device_by_node(node); -+ if (!ocram_dev) { -+ dev_err(dev, "failed to find ocram device!\n"); -+ return -EINVAL; -+ } -+ -+ iram_pool = dev_get_gen_pool(&ocram_dev->dev); -+ if (!iram_pool) { -+ dev_err(dev, "iram pool unavailable!\n"); -+ return -EINVAL; -+ } -+ -+ iomux_settings_size = ARRAY_SIZE(iomux_offsets_mx6q); -+ iram_iomux_settings = (void*)gen_pool_alloc(iram_pool, -+ (iomux_settings_size * 8) + 8); -+ if (!iram_iomux_settings) { -+ dev_err(dev, "unable to alloc iram for IOMUX settings!\n"); -+ return -ENOMEM; -+ } -+ -+ /* -+ * Allocate extra space to store the number of entries in the -+ * ddr_settings plus 4 extra regsiter information that needs -+ * to be passed to the frequency change code. -+ * sizeof(iram_ddr_settings) = sizeof(ddr_settings) + -+ * entries in ddr_settings + 16. -+ * The last 4 enties store the addresses of the registers: -+ * CCM_BASE_ADDR -+ * MMDC_BASE_ADDR -+ * IOMUX_BASE_ADDR -+ * L2X0_BASE_ADDR -+ */ -+ iram_ddr_settings = (void*)gen_pool_alloc(iram_pool, -+ (ddr_settings_size * 8) + 8 + 32); -+ if (!iram_ddr_settings) { -+ dev_err(dev, "unable to alloc iram for ddr settings!\n"); -+ return -ENOMEM; -+ } -+ i = ddr_settings_size + 1; -+ iram_ddr_settings[i][0] = (unsigned long)mmdc_base; -+ iram_ddr_settings[i+1][0] = (unsigned long)ccm_base; -+ iram_ddr_settings[i+2][0] = (unsigned long)iomux_base; -+ iram_ddr_settings[i+3][0] = (unsigned long)l2_base; -+ -+ if (cpu_is_imx6q()) { -+ /* store the IOMUX settings at boot. 
*/ -+ for (i = 0; i < iomux_settings_size; i++) { -+ iomux_offsets_mx6q[i][1] = -+ readl_relaxed(iomux_base + -+ iomux_offsets_mx6q[i][0]); -+ iram_iomux_settings[i+1][0] = iomux_offsets_mx6q[i][0]; -+ iram_iomux_settings[i+1][1] = iomux_offsets_mx6q[i][1]; -+ } -+ } -+ -+ if (cpu_is_imx6dl()) { -+ for (i = 0; i < iomux_settings_size; i++) { -+ iomux_offsets_mx6dl[i][1] = -+ readl_relaxed(iomux_base + -+ iomux_offsets_mx6dl[i][0]); -+ iram_iomux_settings[i+1][0] = iomux_offsets_mx6dl[i][0]; -+ iram_iomux_settings[i+1][1] = iomux_offsets_mx6dl[i][1]; -+ } -+ } -+ -+ ddr_freq_change_iram_base = (void*)gen_pool_alloc(iram_pool, -+ DDR_FREQ_CHANGE_SIZE); -+ if (!ddr_freq_change_iram_base) { -+ dev_err(dev, "Cannot alloc iram for ddr freq change code!\n"); -+ return -ENOMEM; -+ } -+ -+ iram_paddr = gen_pool_virt_to_phys(iram_pool, -+ (unsigned long)ddr_freq_change_iram_base); -+ /* -+ * Need to remap the area here since we want -+ * the memory region to be executable. -+ */ -+ ddr_freq_change_iram_base = __arm_ioremap(iram_paddr, -+ DDR_FREQ_CHANGE_SIZE, -+ MT_MEMORY_RWX_NONCACHED); -+ mx6_change_ddr_freq = (void *)fncpy(ddr_freq_change_iram_base, -+ &mx6_ddr3_freq_change, DDR_FREQ_CHANGE_SIZE); -+ -+ curr_ddr_rate = ddr_normal_rate; -+ -+ return 0; -+} -diff -Nur linux-4.1.3/arch/arm/mach-imx/busfreq-imx6.c linux-xbian-imx6/arch/arm/mach-imx/busfreq-imx6.c ---- linux-4.1.3/arch/arm/mach-imx/busfreq-imx6.c 1970-01-01 01:00:00.000000000 +0100 -+++ linux-xbian-imx6/arch/arm/mach-imx/busfreq-imx6.c 2015-07-27 23:13:01.073153409 +0200 -@@ -0,0 +1,984 @@ -+/* -+ * Copyright (C) 2011-2013 Freescale Semiconductor, Inc. All Rights Reserved. -+ * -+ * This program is free software; you can redistribute it and/or modify -+ * it under the terms of the GNU General Public License as published by -+ * the Free Software Foundation; either version 2 of the License, or -+ * (at your option) any later version. -+ -+ * This program is distributed in the hope that it will be useful, -+ * but WITHOUT ANY WARRANTY; without even the implied warranty of -+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the -+ * GNU General Public License for more details. -+ -+ * You should have received a copy of the GNU General Public License along -+ * with this program; if not, write to the Free Software Foundation, Inc., -+ * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. -+ */ -+ -+/*! -+ * @file busfreq-imx6.c -+ * -+ * @brief A common API for the Freescale Semiconductor iMX6 Busfreq API -+ * -+ * The APIs are for setting bus frequency to different values based on the -+ * highest freqeuncy requested. 
-+ * -+ * @ingroup PM -+ */ -+ -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include "hardware.h" -+ -+#define LPAPM_CLK 24000000 -+#define DDR3_AUDIO_CLK 50000000 -+#define LPDDR2_AUDIO_CLK 100000000 -+ -+int vpu352 = 0; -+ -+int high_bus_freq_mode; -+int med_bus_freq_mode; -+int audio_bus_freq_mode; -+int low_bus_freq_mode; -+int ultra_low_bus_freq_mode; -+unsigned int ddr_med_rate; -+unsigned int ddr_normal_rate; -+ -+#ifdef CONFIG_ARM_IMX6Q_CPUFREQ -+static int bus_freq_scaling_initialized; -+static struct device *busfreq_dev; -+static int busfreq_suspended; -+static u32 org_arm_rate; -+static int bus_freq_scaling_is_active; -+static int high_bus_count, med_bus_count, audio_bus_count, low_bus_count; -+static unsigned int ddr_low_rate; -+ -+extern int init_mmdc_lpddr2_settings(struct platform_device *dev); -+extern int init_mmdc_ddr3_settings(struct platform_device *dev); -+extern int update_ddr_freq(int ddr_rate); -+extern int update_lpddr2_freq(int ddr_rate); -+ -+DEFINE_MUTEX(bus_freq_mutex); -+static DEFINE_SPINLOCK(freq_lock); -+ -+static struct clk *pll2_400; -+static struct clk *periph_clk; -+static struct clk *periph_pre_clk; -+static struct clk *periph_clk2_sel; -+static struct clk *periph_clk2; -+static struct clk *osc_clk; -+static struct clk *cpu_clk; -+static struct clk *pll3; -+static struct clk *pll2; -+static struct clk *pll2_200; -+static struct clk *pll1_sys; -+static struct clk *periph2_clk; -+static struct clk *ocram_clk; -+static struct clk *ahb_clk; -+static struct clk *pll1_sw_clk; -+static struct clk *periph2_pre_clk; -+static struct clk *periph2_clk2_sel; -+static struct clk *periph2_clk2; -+static struct clk *step_clk; -+static struct clk *axi_sel_clk; -+static struct clk *pll3_pfd1_540m; -+ -+static u32 pll2_org_rate; -+static struct delayed_work low_bus_freq_handler; -+static struct delayed_work bus_freq_daemon; -+ -+static void enter_lpm_imx6sl(void) -+{ -+ unsigned long flags; -+ -+ if (high_bus_freq_mode) { -+ pll2_org_rate = clk_get_rate(pll2); -+ /* Set periph_clk to be sourced from OSC_CLK */ -+ clk_set_parent(periph_clk2_sel, osc_clk); -+ clk_set_parent(periph_clk, periph_clk2); -+ /* Ensure AHB/AXI clks are at 24MHz. */ -+ clk_set_rate(ahb_clk, LPAPM_CLK); -+ clk_set_rate(ocram_clk, LPAPM_CLK); -+ } -+ if (audio_bus_count) { -+ /* Set AHB to 8MHz to lower pwer.*/ -+ clk_set_rate(ahb_clk, LPAPM_CLK / 3); -+ -+ /* Set up DDR to 100MHz. */ -+ spin_lock_irqsave(&freq_lock, flags); -+ update_lpddr2_freq(LPDDR2_AUDIO_CLK); -+ spin_unlock_irqrestore(&freq_lock, flags); -+ -+ /* Fix the clock tree in kernel */ -+ clk_set_rate(pll2, pll2_org_rate); -+ clk_set_parent(periph2_pre_clk, pll2_200); -+ clk_set_parent(periph2_clk, periph2_pre_clk); -+ -+ if (low_bus_freq_mode || ultra_low_bus_freq_mode) { -+ /* -+ * Swtich ARM to run off PLL2_PFD2_400MHz -+ * since DDR is anyway at 100MHz. -+ */ -+ clk_set_parent(step_clk, pll2_400); -+ clk_set_parent(pll1_sw_clk, step_clk); -+ /* -+ * Ensure that the clock will be -+ * at original speed. -+ */ -+ clk_set_rate(cpu_clk, org_arm_rate); -+ } -+ low_bus_freq_mode = 0; -+ ultra_low_bus_freq_mode = 0; -+ audio_bus_freq_mode = 1; -+ } else { -+ u32 arm_div, pll1_rate; -+ org_arm_rate = clk_get_rate(cpu_clk); -+ if (low_bus_freq_mode && low_bus_count == 0) { -+ /* -+ * We are already in DDR @ 24MHz state, but -+ * no one but ARM needs the DDR. 
In this case, -+ * we can lower the DDR freq to 1MHz when ARM -+ * enters WFI in this state. Keep track of this state. -+ */ -+ ultra_low_bus_freq_mode = 1; -+ low_bus_freq_mode = 0; -+ audio_bus_freq_mode = 0; -+ } else { -+ if (!ultra_low_bus_freq_mode && !low_bus_freq_mode) { -+ /* -+ * Set DDR to 24MHz. -+ * Since we are going to bypass PLL2, -+ * we need to move ARM clk off PLL2_PFD2 -+ * to PLL1. Make sure the PLL1 is running -+ * at the lowest possible freq. -+ */ -+ clk_set_rate(pll1_sys, -+ clk_round_rate(pll1_sys, org_arm_rate)); -+ pll1_rate = clk_get_rate(pll1_sys); -+ arm_div = pll1_rate / org_arm_rate + 1; -+ /* -+ * Ensure ARM CLK is lower before -+ * changing the parent. -+ */ -+ clk_set_rate(cpu_clk, org_arm_rate / arm_div); -+ /* Now set the ARM clk parent to PLL1_SYS. */ -+ clk_set_parent(pll1_sw_clk, pll1_sys); -+ -+ /* -+ * Set STEP_CLK back to OSC to save power and -+ * also to maintain the parent.The WFI iram code -+ * will switch step_clk to osc, but the clock API -+ * is not aware of the change and when a new request -+ * to change the step_clk parent to pll2_pfd2_400M -+ * is requested sometime later, the change is ignored. -+ */ -+ clk_set_parent(step_clk, osc_clk); -+ /* Now set DDR to 24MHz. */ -+ spin_lock_irqsave(&freq_lock, flags); -+ update_lpddr2_freq(LPAPM_CLK); -+ spin_unlock_irqrestore(&freq_lock, flags); -+ -+ /* -+ * Fix the clock tree in kernel. -+ * Make sure PLL2 rate is updated as it gets -+ * bypassed in the DDR freq change code. -+ */ -+ clk_set_rate(pll2, LPAPM_CLK); -+ clk_set_parent(periph2_clk2_sel, pll2); -+ clk_set_parent(periph2_clk, periph2_clk2_sel); -+ -+ } -+ if (low_bus_count == 0) { -+ ultra_low_bus_freq_mode = 1; -+ low_bus_freq_mode = 0; -+ } else { -+ ultra_low_bus_freq_mode = 0; -+ low_bus_freq_mode = 1; -+ } -+ audio_bus_freq_mode = 0; -+ } -+ } -+} -+ -+static void exit_lpm_imx6sl(void) -+{ -+ unsigned long flags; -+ -+ spin_lock_irqsave(&freq_lock, flags); -+ /* Change DDR freq in IRAM. */ -+ update_lpddr2_freq(ddr_normal_rate); -+ spin_unlock_irqrestore(&freq_lock, flags); -+ -+ /* -+ * Fix the clock tree in kernel. -+ * Make sure PLL2 rate is updated as it gets -+ * un-bypassed in the DDR freq change code. -+ */ -+ clk_set_rate(pll2, pll2_org_rate); -+ clk_set_parent(periph2_pre_clk, pll2_400); -+ clk_set_parent(periph2_clk, periph2_pre_clk); -+ -+ /* Ensure that periph_clk is sourced from PLL2_400. */ -+ clk_set_parent(periph_pre_clk, pll2_400); -+ /* -+ * Before switching the perhiph_clk, ensure that the -+ * AHB/AXI will not be too fast. -+ */ -+ clk_set_rate(ahb_clk, LPAPM_CLK / 3); -+ clk_set_rate(ocram_clk, LPAPM_CLK / 2); -+ clk_set_parent(periph_clk, periph_pre_clk); -+ -+ if (low_bus_freq_mode || ultra_low_bus_freq_mode) { -+ /* Move ARM from PLL1_SW_CLK to PLL2_400. */ -+ clk_set_parent(step_clk, pll2_400); -+ clk_set_parent(pll1_sw_clk, step_clk); -+ clk_set_rate(cpu_clk, org_arm_rate); -+ ultra_low_bus_freq_mode = 0; -+ } -+} -+ -+int reduce_bus_freq(void) -+{ -+ int ret = 0; -+ clk_prepare_enable(pll3); -+ if (cpu_is_imx6sl()) -+ enter_lpm_imx6sl(); -+ else { -+ if (cpu_is_imx6dl() && (clk_get_parent(axi_sel_clk) -+ != periph_clk)) -+ /* Set axi to periph_clk */ -+ clk_set_parent(axi_sel_clk, periph_clk); -+ -+ if (audio_bus_count) { -+ /* Need to ensure that PLL2_PFD_400M is kept ON. 
*/ -+ clk_prepare_enable(pll2_400); -+ update_ddr_freq(DDR3_AUDIO_CLK); -+ /* Make sure periph clk's parent also got updated */ -+ ret = clk_set_parent(periph_clk2_sel, pll3); -+ if (ret) -+ dev_WARN(busfreq_dev, -+ "%s: %d: clk set parent fail!\n", -+ __func__, __LINE__); -+ ret = clk_set_parent(periph_pre_clk, pll2_200); -+ if (ret) -+ dev_WARN(busfreq_dev, -+ "%s: %d: clk set parent fail!\n", -+ __func__, __LINE__); -+ ret = clk_set_parent(periph_clk, periph_pre_clk); -+ if (ret) -+ dev_WARN(busfreq_dev, -+ "%s: %d: clk set parent fail!\n", -+ __func__, __LINE__); -+ audio_bus_freq_mode = 1; -+ low_bus_freq_mode = 0; -+ } else { -+ update_ddr_freq(LPAPM_CLK); -+ /* Make sure periph clk's parent also got updated */ -+ ret = clk_set_parent(periph_clk2_sel, osc_clk); -+ if (ret) -+ dev_WARN(busfreq_dev, -+ "%s: %d: clk set parent fail!\n", -+ __func__, __LINE__); -+ /* Set periph_clk parent to OSC via periph_clk2_sel */ -+ ret = clk_set_parent(periph_clk, periph_clk2); -+ if (ret) -+ dev_WARN(busfreq_dev, -+ "%s: %d: clk set parent fail!\n", -+ __func__, __LINE__); -+ if (audio_bus_freq_mode) -+ clk_disable_unprepare(pll2_400); -+ low_bus_freq_mode = 1; -+ audio_bus_freq_mode = 0; -+ } -+ } -+ clk_disable_unprepare(pll3); -+ -+ med_bus_freq_mode = 0; -+ high_bus_freq_mode = 0; -+ -+ if (audio_bus_freq_mode) -+ dev_dbg(busfreq_dev, "Bus freq set to audio mode. Count:\ -+ high %d, med %d, audio %d\n", -+ high_bus_count, med_bus_count, audio_bus_count); -+ if (low_bus_freq_mode) -+ dev_dbg(busfreq_dev, "Bus freq set to low mode. Count:\ -+ high %d, med %d, audio %d\n", -+ high_bus_count, med_bus_count, audio_bus_count); -+ -+ return ret; -+} -+ -+static void reduce_bus_freq_handler(struct work_struct *work) -+{ -+ mutex_lock(&bus_freq_mutex); -+ -+ reduce_bus_freq(); -+ -+ mutex_unlock(&bus_freq_mutex); -+} -+ -+/* -+ * Set the DDR, AHB to 24MHz. -+ * This mode will be activated only when none of the modules that -+ * need a higher DDR or AHB frequency are active. -+ */ -+int set_low_bus_freq(void) -+{ -+ if (busfreq_suspended) -+ return 0; -+ -+ if (!bus_freq_scaling_initialized || !bus_freq_scaling_is_active) -+ return 0; -+ -+ /* -+ * Check to see if we need to got from -+ * low bus freq mode to audio bus freq mode. -+ * If so, the change needs to be done immediately. -+ */ -+ if (audio_bus_count && (low_bus_freq_mode || ultra_low_bus_freq_mode)) -+ reduce_bus_freq(); -+ else -+ /* -+ * Don't lower the frequency immediately. Instead -+ * scheduled a delayed work and drop the freq if -+ * the conditions still remain the same. -+ */ -+ schedule_delayed_work(&low_bus_freq_handler, -+ usecs_to_jiffies(3000000)); -+ return 0; -+} -+ -+/* -+ * Set the DDR to either 528MHz or 400MHz for iMX6qd -+ * or 400MHz for iMX6dl. 
-+ */ -+int set_high_bus_freq(int high_bus_freq) -+{ -+ int ret = 0; -+ struct clk *periph_clk_parent; -+ -+ if (bus_freq_scaling_initialized && bus_freq_scaling_is_active) -+ cancel_delayed_work_sync(&low_bus_freq_handler); -+ -+ if (busfreq_suspended) -+ return 0; -+ -+ if (cpu_is_imx6q()) -+ periph_clk_parent = pll2; -+ else -+ periph_clk_parent = pll2_400; -+ -+ if (!bus_freq_scaling_initialized || !bus_freq_scaling_is_active) -+ return 0; -+ -+ if (high_bus_freq_mode) -+ return 0; -+ -+ /* medium bus freq is only supported for MX6DQ */ -+ if (med_bus_freq_mode && !high_bus_freq) -+ return 0; -+ -+ clk_prepare_enable(pll3); -+ if (cpu_is_imx6sl()) -+ exit_lpm_imx6sl(); -+ else { -+ if (high_bus_freq) { -+ update_ddr_freq(ddr_normal_rate); -+ /* Make sure periph clk's parent also got updated */ -+ ret = clk_set_parent(periph_clk2_sel, pll3); -+ if (ret) -+ dev_WARN(busfreq_dev, -+ "%s: %d: clk set parent fail!\n", -+ __func__, __LINE__); -+ ret = clk_set_parent(periph_pre_clk, periph_clk_parent); -+ if (ret) -+ dev_WARN(busfreq_dev, -+ "%s: %d: clk set parent fail!\n", -+ __func__, __LINE__); -+ ret = clk_set_parent(periph_clk, periph_pre_clk); -+ if (ret) -+ dev_WARN(busfreq_dev, -+ "%s: %d: clk set parent fail!\n", -+ __func__, __LINE__); -+ if (cpu_is_imx6dl() && (clk_get_parent(axi_sel_clk) -+ != pll3_pfd1_540m)) -+ /* Set axi to pll3_pfd1_540m */ -+ clk_set_parent(axi_sel_clk, pll3_pfd1_540m); -+ } else { -+ update_ddr_freq(ddr_med_rate); -+ /* Make sure periph clk's parent also got updated */ -+ ret = clk_set_parent(periph_clk2_sel, pll3); -+ if (ret) -+ dev_WARN(busfreq_dev, -+ "%s: %d: clk set parent fail!\n", -+ __func__, __LINE__); -+ ret = clk_set_parent(periph_pre_clk, pll2_400); -+ if (ret) -+ dev_WARN(busfreq_dev, -+ "%s: %d: clk set parent fail!\n", -+ __func__, __LINE__); -+ ret = clk_set_parent(periph_clk, periph_pre_clk); -+ if (ret) -+ dev_WARN(busfreq_dev, -+ "%s: %d: clk set parent fail!\n", -+ __func__, __LINE__); -+ } -+ if (audio_bus_freq_mode) -+ clk_disable_unprepare(pll2_400); -+ } -+ -+ high_bus_freq_mode = 1; -+ med_bus_freq_mode = 0; -+ low_bus_freq_mode = 0; -+ audio_bus_freq_mode = 0; -+ -+ clk_disable_unprepare(pll3); -+ -+ if (high_bus_freq_mode) -+ dev_dbg(busfreq_dev, "Bus freq set to high mode. Count:\ -+ high %d, med %d, audio %d\n", -+ high_bus_count, med_bus_count, audio_bus_count); -+ if (med_bus_freq_mode) -+ dev_dbg(busfreq_dev, "Bus freq set to med mode. Count:\ -+ high %d, med %d, audio %d\n", -+ high_bus_count, med_bus_count, audio_bus_count); -+ -+ return 0; -+} -+#endif -+ -+void request_bus_freq(enum bus_freq_mode mode) -+{ -+#ifdef CONFIG_ARM_IMX6Q_CPUFREQ -+ mutex_lock(&bus_freq_mutex); -+ -+ if (mode == BUS_FREQ_HIGH) -+ high_bus_count++; -+ else if (mode == BUS_FREQ_MED) -+ med_bus_count++; -+ else if (mode == BUS_FREQ_AUDIO) -+ audio_bus_count++; -+ else if (mode == BUS_FREQ_LOW) -+ low_bus_count++; -+ -+ if (busfreq_suspended || !bus_freq_scaling_initialized || -+ !bus_freq_scaling_is_active) { -+ mutex_unlock(&bus_freq_mutex); -+ return; -+ } -+ cancel_delayed_work_sync(&low_bus_freq_handler); -+ -+ if (cpu_is_imx6dl()) { -+ /* No support for medium setpoint on MX6DL. 
*/ -+ if (mode == BUS_FREQ_MED) { -+ high_bus_count++; -+ mode = BUS_FREQ_HIGH; -+ } -+ } -+ -+ if ((mode == BUS_FREQ_HIGH) && (!high_bus_freq_mode)) { -+ set_high_bus_freq(1); -+ mutex_unlock(&bus_freq_mutex); -+ return; -+ } -+ -+ if ((mode == BUS_FREQ_MED) && (!high_bus_freq_mode) && -+ (!med_bus_freq_mode)) { -+ set_high_bus_freq(0); -+ mutex_unlock(&bus_freq_mutex); -+ return; -+ } -+ if ((mode == BUS_FREQ_AUDIO) && (!high_bus_freq_mode) && -+ (!med_bus_freq_mode) && (!audio_bus_freq_mode)) { -+ set_low_bus_freq(); -+ mutex_unlock(&bus_freq_mutex); -+ return; -+ } -+ mutex_unlock(&bus_freq_mutex); -+#endif -+ return; -+} -+EXPORT_SYMBOL(request_bus_freq); -+ -+void release_bus_freq(enum bus_freq_mode mode) -+{ -+#ifdef CONFIG_ARM_IMX6Q_CPUFREQ -+ mutex_lock(&bus_freq_mutex); -+ -+ if (mode == BUS_FREQ_HIGH) { -+ if (high_bus_count == 0) { -+ dev_err(busfreq_dev, "high bus count mismatch!\n"); -+ dump_stack(); -+ mutex_unlock(&bus_freq_mutex); -+ return; -+ } -+ high_bus_count--; -+ } else if (mode == BUS_FREQ_MED) { -+ if (med_bus_count == 0) { -+ dev_err(busfreq_dev, "med bus count mismatch!\n"); -+ dump_stack(); -+ mutex_unlock(&bus_freq_mutex); -+ return; -+ } -+ med_bus_count--; -+ } else if (mode == BUS_FREQ_AUDIO) { -+ if (audio_bus_count == 0) { -+ dev_err(busfreq_dev, "audio bus count mismatch!\n"); -+ dump_stack(); -+ mutex_unlock(&bus_freq_mutex); -+ return; -+ } -+ audio_bus_count--; -+ } else if (mode == BUS_FREQ_LOW) { -+ if (low_bus_count == 0) { -+ dev_err(busfreq_dev, "low bus count mismatch!\n"); -+ dump_stack(); -+ mutex_unlock(&bus_freq_mutex); -+ return; -+ } -+ low_bus_count--; -+ } -+ -+ if (busfreq_suspended || !bus_freq_scaling_initialized || -+ !bus_freq_scaling_is_active) { -+ mutex_unlock(&bus_freq_mutex); -+ return; -+ } -+ -+ if (cpu_is_imx6dl()) { -+ /* No support for medium setpoint on MX6DL. 
*/ -+ if (mode == BUS_FREQ_MED) { -+ high_bus_count--; -+ mode = BUS_FREQ_HIGH; -+ } -+ } -+ -+ if ((!audio_bus_freq_mode) && (high_bus_count == 0) && -+ (med_bus_count == 0) && (audio_bus_count != 0)) { -+ set_low_bus_freq(); -+ mutex_unlock(&bus_freq_mutex); -+ return; -+ } -+ if ((!low_bus_freq_mode) && (high_bus_count == 0) && -+ (med_bus_count == 0) && (audio_bus_count == 0) && -+ (low_bus_count != 0)) { -+ set_low_bus_freq(); -+ mutex_unlock(&bus_freq_mutex); -+ return; -+ } -+ if ((!ultra_low_bus_freq_mode) && (high_bus_count == 0) && -+ (med_bus_count == 0) && (audio_bus_count == 0) && -+ (low_bus_count == 0)) { -+ set_low_bus_freq(); -+ mutex_unlock(&bus_freq_mutex); -+ return; -+ } -+ -+ mutex_unlock(&bus_freq_mutex); -+#endif -+ return; -+} -+EXPORT_SYMBOL(release_bus_freq); -+ -+#ifdef CONFIG_ARM_IMX6Q_CPUFREQ -+static void bus_freq_daemon_handler(struct work_struct *work) -+{ -+ mutex_lock(&bus_freq_mutex); -+ if ((!low_bus_freq_mode) && (!ultra_low_bus_freq_mode) && (high_bus_count == 0) && -+ (med_bus_count == 0) && (audio_bus_count == 0)) -+ set_low_bus_freq(); -+ mutex_unlock(&bus_freq_mutex); -+} -+ -+static ssize_t bus_freq_scaling_enable_show(struct device *dev, -+ struct device_attribute *attr, char *buf) -+{ -+ if (bus_freq_scaling_is_active) -+ return sprintf(buf, "Bus frequency scaling is enabled\n"); -+ else -+ return sprintf(buf, "Bus frequency scaling is disabled\n"); -+} -+ -+static ssize_t vpu352_enable_show(struct device *dev, -+ struct device_attribute *attr, char *buf) -+{ -+ if (vpu352) -+ return sprintf(buf, "VPU352M is enabled\n"); -+ else -+ return sprintf(buf, "VPU352M is disabled\n"); -+} -+ -+static int vpu352_setup(char *options) -+{ -+ return kstrtol(options, 0, (long int *)&vpu352); -+} -+ -+static ssize_t bus_freq_scaling_enable_store(struct device *dev, -+ struct device_attribute *attr, -+ const char *buf, size_t size) -+{ -+ if (strncmp(buf, "1", 1) == 0) { -+ bus_freq_scaling_is_active = 1; -+ set_high_bus_freq(1); -+ /* -+ * We set bus freq to highest at the beginning, -+ * so we use this daemon thread to make sure system -+ * can enter low bus mode if -+ * there is no high bus request pending -+ */ -+ schedule_delayed_work(&bus_freq_daemon, -+ usecs_to_jiffies(5000000)); -+ } else if (strncmp(buf, "0", 1) == 0) { -+ if (bus_freq_scaling_is_active) -+ set_high_bus_freq(1); -+ bus_freq_scaling_is_active = 0; -+ } -+ return size; -+} -+ -+static int bus_freq_pm_notify(struct notifier_block *nb, unsigned long event, -+ void *dummy) -+{ -+ mutex_lock(&bus_freq_mutex); -+ -+ if (event == PM_SUSPEND_PREPARE) { -+ high_bus_count++; -+ set_high_bus_freq(1); -+ busfreq_suspended = 1; -+ } else if (event == PM_POST_SUSPEND) { -+ busfreq_suspended = 0; -+ high_bus_count--; -+ schedule_delayed_work(&bus_freq_daemon, -+ usecs_to_jiffies(5000000)); -+ } -+ -+ mutex_unlock(&bus_freq_mutex); -+ -+ return NOTIFY_OK; -+} -+ -+static int busfreq_reboot_notifier_event(struct notifier_block *this, -+ unsigned long event, void *ptr) -+{ -+ /* System is rebooting. Set the system into high_bus_freq_mode. 
*/ -+ request_bus_freq(BUS_FREQ_HIGH); -+ -+ return 0; -+} -+ -+static struct notifier_block imx_bus_freq_pm_notifier = { -+ .notifier_call = bus_freq_pm_notify, -+}; -+ -+static struct notifier_block imx_busfreq_reboot_notifier = { -+ .notifier_call = busfreq_reboot_notifier_event, -+}; -+ -+ -+static DEVICE_ATTR(enable, 0644, bus_freq_scaling_enable_show, -+ bus_freq_scaling_enable_store); -+static DEVICE_ATTR(vpu352, 0444, vpu352_enable_show, -+ NULL); -+#endif -+ -+/*! -+ * This is the probe routine for the bus frequency driver. -+ * -+ * @param pdev The platform device structure -+ * -+ * @return The function returns 0 on success -+ * -+ */ -+ -+static int busfreq_probe(struct platform_device *pdev) -+{ -+#ifdef CONFIG_ARM_IMX6Q_CPUFREQ -+ u32 err; -+ -+ busfreq_dev = &pdev->dev; -+ -+ pll2_400 = devm_clk_get(&pdev->dev, "pll2_pfd2_396m"); -+ if (IS_ERR(pll2_400)) { -+ dev_err(busfreq_dev, "%s: failed to get pll2_pfd2_396m\n", -+ __func__); -+ return PTR_ERR(pll2_400); -+ } -+ -+ pll2_200 = devm_clk_get(&pdev->dev, "pll2_198m"); -+ if (IS_ERR(pll2_200)) { -+ dev_err(busfreq_dev, "%s: failed to get pll2_198m\n", -+ __func__); -+ return PTR_ERR(pll2_200); -+ } -+ -+ pll2 = devm_clk_get(&pdev->dev, "pll2_bus"); -+ if (IS_ERR(pll2)) { -+ dev_err(busfreq_dev, "%s: failed to get pll2_bus\n", -+ __func__); -+ return PTR_ERR(pll2); -+ } -+ -+ cpu_clk = devm_clk_get(&pdev->dev, "arm"); -+ if (IS_ERR(cpu_clk)) { -+ dev_err(busfreq_dev, "%s: failed to get cpu_clk\n", -+ __func__); -+ return PTR_ERR(cpu_clk); -+ } -+ -+ pll3 = devm_clk_get(&pdev->dev, "pll3_usb_otg"); -+ if (IS_ERR(pll3)) { -+ dev_err(busfreq_dev, "%s: failed to get pll3_usb_otg\n", -+ __func__); -+ return PTR_ERR(pll3); -+ } -+ -+ periph_clk = devm_clk_get(&pdev->dev, "periph"); -+ if (IS_ERR(periph_clk)) { -+ dev_err(busfreq_dev, "%s: failed to get periph\n", -+ __func__); -+ return PTR_ERR(periph_clk); -+ } -+ -+ periph_pre_clk = devm_clk_get(&pdev->dev, "periph_pre"); -+ if (IS_ERR(periph_pre_clk)) { -+ dev_err(busfreq_dev, "%s: failed to get periph_pre\n", -+ __func__); -+ return PTR_ERR(periph_pre_clk); -+ } -+ -+ periph_clk2 = devm_clk_get(&pdev->dev, "periph_clk2"); -+ if (IS_ERR(periph_clk2)) { -+ dev_err(busfreq_dev, "%s: failed to get periph_clk2\n", -+ __func__); -+ return PTR_ERR(periph_clk2); -+ } -+ -+ periph_clk2_sel = devm_clk_get(&pdev->dev, "periph_clk2_sel"); -+ if (IS_ERR(periph_clk2_sel)) { -+ dev_err(busfreq_dev, "%s: failed to get periph_clk2_sel\n", -+ __func__); -+ return PTR_ERR(periph_clk2_sel); -+ } -+ -+ osc_clk = devm_clk_get(&pdev->dev, "osc"); -+ if (IS_ERR(osc_clk)) { -+ dev_err(busfreq_dev, "%s: failed to get osc_clk\n", -+ __func__); -+ return PTR_ERR(osc_clk); -+ } -+ -+ if (cpu_is_imx6dl()) { -+ axi_sel_clk = devm_clk_get(&pdev->dev, "axi_sel"); -+ if (IS_ERR(axi_sel_clk)) { -+ dev_err(busfreq_dev, "%s: failed to get axi_sel_clk\n", -+ __func__); -+ return PTR_ERR(axi_sel_clk); -+ } -+ -+ pll3_pfd1_540m = devm_clk_get(&pdev->dev, "pll3_pfd1_540m"); -+ if (IS_ERR(pll3_pfd1_540m)) { -+ dev_err(busfreq_dev, -+ "%s: failed to get pll3_pfd1_540m\n", __func__); -+ return PTR_ERR(pll3_pfd1_540m); -+ } -+ } -+ -+ if (cpu_is_imx6sl()) { -+ pll1_sys = devm_clk_get(&pdev->dev, "pll1_sys"); -+ if (IS_ERR(pll1_sys)) { -+ dev_err(busfreq_dev, "%s: failed to get pll1_sys\n", -+ __func__); -+ return PTR_ERR(pll1_sys); -+ } -+ -+ ahb_clk = devm_clk_get(&pdev->dev, "ahb"); -+ if (IS_ERR(ahb_clk)) { -+ dev_err(busfreq_dev, "%s: failed to get ahb_clk\n", -+ __func__); -+ return PTR_ERR(ahb_clk); -+ } -+ -+ 
ocram_clk = devm_clk_get(&pdev->dev, "ocram"); -+ if (IS_ERR(ocram_clk)) { -+ dev_err(busfreq_dev, "%s: failed to get ocram_clk\n", -+ __func__); -+ return PTR_ERR(ocram_clk); -+ } -+ -+ pll1_sw_clk = devm_clk_get(&pdev->dev, "pll1_sw"); -+ if (IS_ERR(pll1_sw_clk)) { -+ dev_err(busfreq_dev, "%s: failed to get pll1_sw_clk\n", -+ __func__); -+ return PTR_ERR(pll1_sw_clk); -+ } -+ -+ periph2_clk = devm_clk_get(&pdev->dev, "periph2"); -+ if (IS_ERR(periph2_clk)) { -+ dev_err(busfreq_dev, "%s: failed to get periph2\n", -+ __func__); -+ return PTR_ERR(periph2_clk); -+ } -+ -+ periph2_pre_clk = devm_clk_get(&pdev->dev, "periph2_pre"); -+ if (IS_ERR(periph2_pre_clk)) { -+ dev_err(busfreq_dev, -+ "%s: failed to get periph2_pre_clk\n", -+ __func__); -+ return PTR_ERR(periph2_pre_clk); -+ } -+ -+ periph2_clk2 = devm_clk_get(&pdev->dev, "periph2_clk2"); -+ if (IS_ERR(periph2_clk2)) { -+ dev_err(busfreq_dev, -+ "%s: failed to get periph2_clk2\n", -+ __func__); -+ return PTR_ERR(periph2_clk2); -+ } -+ -+ periph2_clk2_sel = devm_clk_get(&pdev->dev, "periph2_clk2_sel"); -+ if (IS_ERR(periph2_clk2_sel)) { -+ dev_err(busfreq_dev, -+ "%s: failed to get periph2_clk2_sel\n", -+ __func__); -+ return PTR_ERR(periph2_clk2_sel); -+ } -+ -+ step_clk = devm_clk_get(&pdev->dev, "step"); -+ if (IS_ERR(step_clk)) { -+ dev_err(busfreq_dev, -+ "%s: failed to get step_clk\n", -+ __func__); -+ return PTR_ERR(periph2_clk2_sel); -+ } -+ -+ } -+ -+ err = sysfs_create_file(&busfreq_dev->kobj, &dev_attr_enable.attr); -+ if (err) { -+ dev_err(busfreq_dev, -+ "Unable to register sysdev entry for BUSFREQ"); -+ return err; -+ } -+ err = sysfs_create_file(&busfreq_dev->kobj, &dev_attr_vpu352.attr); -+ if (err) { -+ dev_err(busfreq_dev, -+ "Unable to register sysdev entry for BUSFREQ"); -+ return err; -+ } -+ -+ if (of_property_read_u32(pdev->dev.of_node, "fsl,max_ddr_freq", -+ &ddr_normal_rate)) { -+ dev_err(busfreq_dev, "max_ddr_freq entry missing\n"); -+ return -EINVAL; -+ } -+#endif -+ -+ high_bus_freq_mode = 1; -+ med_bus_freq_mode = 0; -+ low_bus_freq_mode = 0; -+ audio_bus_freq_mode = 0; -+ ultra_low_bus_freq_mode = 0; -+ -+#ifdef CONFIG_ARM_IMX6Q_CPUFREQ -+ bus_freq_scaling_is_active = 1; -+ bus_freq_scaling_initialized = 1; -+ -+ ddr_low_rate = LPAPM_CLK; -+ if (cpu_is_imx6q()) { -+ if (of_property_read_u32(pdev->dev.of_node, "fsl,med_ddr_freq", -+ &ddr_med_rate)) { -+ dev_info(busfreq_dev, -+ "DDR medium rate not supported.\n"); -+ ddr_med_rate = ddr_normal_rate; -+ } -+ } -+ -+ INIT_DELAYED_WORK(&low_bus_freq_handler, reduce_bus_freq_handler); -+ INIT_DELAYED_WORK(&bus_freq_daemon, bus_freq_daemon_handler); -+ register_pm_notifier(&imx_bus_freq_pm_notifier); -+ register_reboot_notifier(&imx_busfreq_reboot_notifier); -+ -+ if (cpu_is_imx6sl()) -+ err = init_mmdc_lpddr2_settings(pdev); -+ else -+ err = init_mmdc_ddr3_settings(pdev); -+ if (err) { -+ dev_err(busfreq_dev, "Busfreq init of MMDC failed\n"); -+ return err; -+ } -+#endif -+ return 0; -+} -+ -+static const struct of_device_id imx6_busfreq_ids[] = { -+ { .compatible = "fsl,imx6_busfreq", }, -+ { /* sentinel */ } -+}; -+ -+static struct platform_driver busfreq_driver = { -+ .driver = { -+ .name = "imx6_busfreq", -+ .owner = THIS_MODULE, -+ .of_match_table = imx6_busfreq_ids, -+ }, -+ .probe = busfreq_probe, -+}; -+ -+/*! -+ * Initialise the busfreq_driver. -+ * -+ * @return The function always returns 0. -+ */ -+ -+static int __init busfreq_init(void) -+{ -+ if (vpu352) { -+ printk(KERN_INFO "VPU@352Mhz activated. 
Bus freq driver module not loading\n"); -+ return 0; -+ } -+ -+ if (platform_driver_register(&busfreq_driver) != 0) -+ return -ENODEV; -+ -+ printk(KERN_INFO "Bus freq driver module loaded\n"); -+ -+ return 0; -+} -+ -+static void __exit busfreq_cleanup(void) -+{ -+#ifdef CONFIG_ARM_IMX6Q_CPUFREQ -+ sysfs_remove_file(&busfreq_dev->kobj, &dev_attr_enable.attr); -+ -+ bus_freq_scaling_initialized = 0; -+#endif -+ /* Unregister the device structure */ -+ platform_driver_unregister(&busfreq_driver); -+} -+ -+__setup("vpu352=", vpu352_setup); -+module_init(busfreq_init); -+module_exit(busfreq_cleanup); -+ -+MODULE_AUTHOR("Freescale Semiconductor, Inc."); -+MODULE_DESCRIPTION("BusFreq driver"); -+MODULE_LICENSE("GPL"); -diff -Nur linux-4.1.3/arch/arm/mach-imx/busfreq_lpddr2.c linux-xbian-imx6/arch/arm/mach-imx/busfreq_lpddr2.c ---- linux-4.1.3/arch/arm/mach-imx/busfreq_lpddr2.c 1970-01-01 01:00:00.000000000 +0100 -+++ linux-xbian-imx6/arch/arm/mach-imx/busfreq_lpddr2.c 2015-07-27 23:13:01.073153409 +0200 -@@ -0,0 +1,183 @@ -+/* -+ * Copyright (C) 2011-2013 Freescale Semiconductor, Inc. All Rights Reserved. -+ */ -+ -+/* -+ * The code contained herein is licensed under the GNU General Public -+ * License. You may obtain a copy of the GNU General Public License -+ * Version 2 or later at the following locations: -+ * -+ * http://www.opensource.org/licenses/gpl-license.html -+ * http://www.gnu.org/copyleft/gpl.html -+ */ -+ -+/*! -+ * @file busfreq_lpddr2.c -+ * -+ * @brief iMX6 LPDDR2 frequency change specific file. -+ * -+ * @ingroup PM -+ */ -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+ -+#include "hardware.h" -+ -+/* DDR settings */ -+static void __iomem *mmdc_base; -+static void __iomem *anatop_base; -+static void __iomem *ccm_base; -+static void __iomem *l2_base; -+static struct device *busfreq_dev; -+static void *ddr_freq_change_iram_base; -+static int curr_ddr_rate; -+ -+unsigned long reg_addrs[4]; -+ -+void (*mx6_change_lpddr2_freq)(u32 ddr_freq, int bus_freq_mode, -+ void *iram_addr) = NULL; -+ -+extern unsigned int ddr_normal_rate; -+extern int low_bus_freq_mode; -+extern int ultra_low_bus_freq_mode; -+extern void mx6_lpddr2_freq_change(u32 freq, int bus_freq_mode, -+ void *iram_addr); -+ -+ -+#define LPDDR2_FREQ_CHANGE_SIZE 0x1000 -+ -+ -+/* change the DDR frequency. */ -+int update_lpddr2_freq(int ddr_rate) -+{ -+ if (ddr_rate == curr_ddr_rate) -+ return 0; -+ -+ dev_dbg(busfreq_dev, "\nBus freq set to %d start...\n", ddr_rate); -+ -+ /* -+ * Flush the TLB, to ensure no TLB maintenance occurs -+ * when DDR is in self-refresh. -+ */ -+ local_flush_tlb_all(); -+ /* Now change DDR frequency. 
*/ -+ mx6_change_lpddr2_freq(ddr_rate, -+ (low_bus_freq_mode | ultra_low_bus_freq_mode), -+ reg_addrs); -+ -+ curr_ddr_rate = ddr_rate; -+ -+ dev_dbg(busfreq_dev, "\nBus freq set to %d done...\n", ddr_rate); -+ -+ return 0; -+} -+ -+int init_mmdc_lpddr2_settings(struct platform_device *busfreq_pdev) -+{ -+ struct platform_device *ocram_dev; -+ unsigned int iram_paddr; -+ struct device_node *node; -+ struct gen_pool *iram_pool; -+ -+ busfreq_dev = &busfreq_pdev->dev; -+ node = of_find_compatible_node(NULL, NULL, "fsl,imx6sl-mmdc"); -+ if (!node) { -+ printk(KERN_ERR "failed to find imx6sl-mmdc device tree data!\n"); -+ return -EINVAL; -+ } -+ mmdc_base = of_iomap(node, 0); -+ WARN(!mmdc_base, "unable to map mmdc registers\n"); -+ -+ node = NULL; -+ node = of_find_compatible_node(NULL, NULL, "fsl,imx6sl-ccm"); -+ if (!node) { -+ printk(KERN_ERR "failed to find imx6sl-ccm device tree data!\n"); -+ return -EINVAL; -+ } -+ ccm_base = of_iomap(node, 0); -+ WARN(!ccm_base, "unable to map ccm registers\n"); -+ -+ node = of_find_compatible_node(NULL, NULL, "arm,pl310-cache"); -+ if (!node) { -+ printk(KERN_ERR "failed to find imx6sl-pl310-cache device tree data!\n"); -+ return -EINVAL; -+ } -+ l2_base = of_iomap(node, 0); -+ WARN(!l2_base, "unable to map PL310 registers\n"); -+ -+ node = of_find_compatible_node(NULL, NULL, "fsl,imx6sl-anatop"); -+ if (!node) { -+ printk(KERN_ERR "failed to find imx6sl-pl310-cache device tree data!\n"); -+ return -EINVAL; -+ } -+ anatop_base = of_iomap(node, 0); -+ WARN(!anatop_base, "unable to map anatop registers\n"); -+ -+ node = NULL; -+ node = of_find_compatible_node(NULL, NULL, "mmio-sram"); -+ if (!node) { -+ dev_err(busfreq_dev, "%s: failed to find ocram node\n", -+ __func__); -+ return -EINVAL; -+ } -+ -+ ocram_dev = of_find_device_by_node(node); -+ if (!ocram_dev) { -+ dev_err(busfreq_dev, "failed to find ocram device!\n"); -+ return -EINVAL; -+ } -+ -+ iram_pool = dev_get_gen_pool(&ocram_dev->dev); -+ if (!iram_pool) { -+ dev_err(busfreq_dev, "iram pool unavailable!\n"); -+ return -EINVAL; -+ } -+ -+ reg_addrs[0] = (unsigned long)anatop_base; -+ reg_addrs[1] = (unsigned long)ccm_base; -+ reg_addrs[2] = (unsigned long)mmdc_base; -+ reg_addrs[3] = (unsigned long)l2_base; -+ -+ ddr_freq_change_iram_base = (void *)gen_pool_alloc(iram_pool, -+ LPDDR2_FREQ_CHANGE_SIZE); -+ if (!ddr_freq_change_iram_base) { -+ dev_err(busfreq_dev, -+ "Cannot alloc iram for ddr freq change code!\n"); -+ return -ENOMEM; -+ } -+ -+ iram_paddr = gen_pool_virt_to_phys(iram_pool, -+ (unsigned long)ddr_freq_change_iram_base); -+ /* -+ * Need to remap the area here since we want -+ * the memory region to be executable. 
-+ */ -+ ddr_freq_change_iram_base = __arm_ioremap(iram_paddr, -+ LPDDR2_FREQ_CHANGE_SIZE, -+ MT_MEMORY_RWX_NONCACHED); -+ mx6_change_lpddr2_freq = (void *)fncpy(ddr_freq_change_iram_base, -+ &mx6_lpddr2_freq_change, LPDDR2_FREQ_CHANGE_SIZE); -+ -+ curr_ddr_rate = ddr_normal_rate; -+ -+ return 0; -+} -diff -Nur linux-4.1.3/arch/arm/mach-imx/clk.h linux-xbian-imx6/arch/arm/mach-imx/clk.h ---- linux-4.1.3/arch/arm/mach-imx/clk.h 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/arch/arm/mach-imx/clk.h 2015-07-27 23:13:01.085110746 +0200 -@@ -55,6 +55,34 @@ - shift, 0, &imx_ccm_lock, share_count); - } - -+static inline void imx_clk_prepare_enable(struct clk *clk) -+{ -+ int ret = clk_prepare_enable(clk); -+ -+ if (ret) -+ pr_err("failed to prepare and enable clk %s: %d\n", -+ __clk_get_name(clk), ret); -+} -+ -+static inline int imx_clk_set_parent(struct clk *clk, struct clk *parent) -+{ -+ int ret = clk_set_parent(clk, parent); -+ -+ if (ret) -+ pr_err("failed to set parent of clk %s to %s: %d\n", -+ __clk_get_name(clk), __clk_get_name(parent), ret); -+ return ret; -+} -+ -+static inline void imx_clk_set_rate(struct clk *clk, unsigned long rate) -+{ -+ int ret = clk_set_rate(clk, rate); -+ -+ if (ret) -+ pr_err("failed to set rate of clk %s to %ld: %d\n", -+ __clk_get_name(clk), rate, ret); -+} -+ - struct clk *imx_clk_pfd(const char *name, const char *parent_name, - void __iomem *reg, u8 idx); - -diff -Nur linux-4.1.3/arch/arm/mach-imx/clk-imx6q.c linux-xbian-imx6/arch/arm/mach-imx/clk-imx6q.c ---- linux-4.1.3/arch/arm/mach-imx/clk-imx6q.c 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/arch/arm/mach-imx/clk-imx6q.c 2015-07-27 23:13:01.081124967 +0200 -@@ -24,7 +24,6 @@ - #include "clk.h" - #include "common.h" - #include "hardware.h" -- - static const char *step_sels[] = { "osc", "pll2_pfd2_396m", }; - static const char *pll1_sw_sels[] = { "pll1_sys", "step", }; - static const char *periph_pre_sels[] = { "pll2_bus", "pll2_pfd2_396m", "pll2_pfd0_352m", "pll2_198m", }; -@@ -41,6 +40,8 @@ - static const char *ipu_sels[] = { "mmdc_ch0_axi", "pll2_pfd2_396m", "pll3_120m", "pll3_pfd1_540m", }; - static const char *ldb_di_sels[] = { "pll5_video_div", "pll2_pfd0_352m", "pll2_pfd2_396m", "mmdc_ch1_axi", "pll3_usb_otg", }; - static const char *ipu_di_pre_sels[] = { "mmdc_ch0_axi", "pll3_usb_otg", "pll5_video_div", "pll2_pfd0_352m", "pll2_pfd2_396m", "pll3_pfd1_540m", }; -+static const char *ldb_di0_div_sels[] = { "ldb_di0_div_3_5", "ldb_di0_div_7", }; -+static const char *ldb_di1_div_sels[] = { "ldb_di1_div_3_5", "ldb_di1_div_7", }; - static const char *ipu1_di0_sels[] = { "ipu1_di0_pre", "dummy", "dummy", "ldb_di0", "ldb_di1", }; - static const char *ipu1_di1_sels[] = { "ipu1_di1_pre", "dummy", "dummy", "ldb_di0", "ldb_di1", }; - static const char *ipu2_di0_sels[] = { "ipu2_di0_pre", "dummy", "dummy", "ldb_di0", "ldb_di1", }; -@@ -119,8 +120,118 @@ - static unsigned int share_count_ssi1; - static unsigned int share_count_ssi2; - static unsigned int share_count_ssi3; -+static unsigned int share_count_spdif; - static unsigned int share_count_mipi_core_cfg; - -+static void __iomem *ccm_base; -+ -+static void init_ldb_clks(struct clk *new_parent) -+{ -+ u32 reg; -+ -+ /* -+ * Need to follow a strict procedure when changing the LDB -+ * clock, else we can introduce a glitch. Things to keep in -+ * mind: -+ * 1. The current and new parent clocks must be disabled. -+ * 2. The default clock for ldb_dio_clk is mmdc_ch1 which has -+ * no CG bit. -+ * 3. 
In the RTL implementation of the LDB_DI_CLK_SEL mux -+ * the top four options are in one mux and the PLL3 option along -+ * with another option is in the second mux. There is third mux -+ * used to decide between the first and second mux. -+ * The code below switches the parent to the bottom mux first -+ * and then manipulates the top mux. This ensures that no glitch -+ * will enter the divider. -+ * -+ * Need to disable MMDC_CH1 clock manually as there is no CG bit -+ * for this clock. The only way to disable this clock is to move -+ * it topll3_sw_clk and then to disable pll3_sw_clk -+ * Make sure periph2_clk2_sel is set to pll3_sw_clk -+ */ -+ reg = readl_relaxed(ccm_base + 0x18); -+ reg &= ~(1 << 20); -+ writel_relaxed(reg, ccm_base + 0x18); -+ -+ /* -+ * Set MMDC_CH1 mask bit. -+ */ -+ reg = readl_relaxed(ccm_base + 0x4); -+ reg |= 1 << 16; -+ writel_relaxed(reg, ccm_base + 0x4); -+ -+ /* -+ * Set the periph2_clk_sel to the top mux so that -+ * mmdc_ch1 is from pll3_sw_clk. -+ */ -+ reg = readl_relaxed(ccm_base + 0x14); -+ reg |= 1 << 26; -+ writel_relaxed(reg, ccm_base + 0x14); -+ -+ /* -+ * Wait for the clock switch. -+ */ -+ while (readl_relaxed(ccm_base + 0x48)) -+ ; -+ -+ /* -+ * Disable pll3_sw_clk by selecting the bypass clock source. -+ */ -+ reg = readl_relaxed(ccm_base + 0xc); -+ reg |= 1 << 0; -+ writel_relaxed(reg, ccm_base + 0xc); -+ -+ /* -+ * Set the ldb_di0_clk and ldb_di1_clk to 111b. -+ */ -+ reg = readl_relaxed(ccm_base + 0x2c); -+ reg |= ((7 << 9) | (7 << 12)); -+ writel_relaxed(reg, ccm_base + 0x2c); -+ -+ /* -+ * Set the ldb_di0_clk and ldb_di1_clk to 100b. -+ */ -+ reg = readl_relaxed(ccm_base + 0x2c); -+ reg &= ~((7 << 9) | (7 << 12)); -+ reg |= ((4 << 9) | (4 << 12)); -+ writel_relaxed(reg, ccm_base + 0x2c); -+ -+ /* -+ * Perform the LDB parent clock switch. -+ */ -+ imx_clk_set_parent(clk[IMX6QDL_CLK_LDB_DI0_SEL], new_parent); -+ imx_clk_set_parent(clk[IMX6QDL_CLK_LDB_DI1_SEL], new_parent); -+ -+ /* -+ * Unbypass pll3_sw_clk. -+ */ -+ reg = readl_relaxed(ccm_base + 0xc); -+ reg &= ~(1 << 0); -+ writel_relaxed(reg, ccm_base + 0xc); -+ -+ /* -+ * Set the periph2_clk_sel back to the bottom mux so that -+ * mmdc_ch1 is from its original parent. -+ */ -+ reg = readl_relaxed(ccm_base + 0x14); -+ reg &= ~(1 << 26); -+ writel_relaxed(reg, ccm_base + 0x14); -+ -+ /* -+ * Wait for the clock switch. -+ */ -+ while (readl_relaxed(ccm_base + 0x48)) -+ ; -+ -+ /* -+ * Clear MMDC_CH1 mask bit. 
-+ */ -+ reg = readl_relaxed(ccm_base + 0x4); -+ reg &= ~(1 << 16); -+ writel_relaxed(reg, ccm_base + 0x4); -+ -+} -+ - static void __init imx6q_clocks_init(struct device_node *ccm_node) - { - struct device_node *np; -@@ -174,13 +285,13 @@ - clk[IMX6QDL_PLL7_BYPASS] = imx_clk_mux_flags("pll7_bypass", base + 0x20, 16, 1, pll7_bypass_sels, ARRAY_SIZE(pll7_bypass_sels), CLK_SET_RATE_PARENT); - - /* Do not bypass PLLs initially */ -- clk_set_parent(clk[IMX6QDL_PLL1_BYPASS], clk[IMX6QDL_CLK_PLL1]); -- clk_set_parent(clk[IMX6QDL_PLL2_BYPASS], clk[IMX6QDL_CLK_PLL2]); -- clk_set_parent(clk[IMX6QDL_PLL3_BYPASS], clk[IMX6QDL_CLK_PLL3]); -- clk_set_parent(clk[IMX6QDL_PLL4_BYPASS], clk[IMX6QDL_CLK_PLL4]); -- clk_set_parent(clk[IMX6QDL_PLL5_BYPASS], clk[IMX6QDL_CLK_PLL5]); -- clk_set_parent(clk[IMX6QDL_PLL6_BYPASS], clk[IMX6QDL_CLK_PLL6]); -- clk_set_parent(clk[IMX6QDL_PLL7_BYPASS], clk[IMX6QDL_CLK_PLL7]); -+ imx_clk_set_parent(clk[IMX6QDL_PLL1_BYPASS], clk[IMX6QDL_CLK_PLL1]); -+ imx_clk_set_parent(clk[IMX6QDL_PLL2_BYPASS], clk[IMX6QDL_CLK_PLL2]); -+ imx_clk_set_parent(clk[IMX6QDL_PLL3_BYPASS], clk[IMX6QDL_CLK_PLL3]); -+ imx_clk_set_parent(clk[IMX6QDL_PLL4_BYPASS], clk[IMX6QDL_CLK_PLL4]); -+ imx_clk_set_parent(clk[IMX6QDL_PLL5_BYPASS], clk[IMX6QDL_CLK_PLL5]); -+ imx_clk_set_parent(clk[IMX6QDL_PLL6_BYPASS], clk[IMX6QDL_CLK_PLL6]); -+ imx_clk_set_parent(clk[IMX6QDL_PLL7_BYPASS], clk[IMX6QDL_CLK_PLL7]); - - clk[IMX6QDL_CLK_PLL1_SYS] = imx_clk_gate("pll1_sys", "pll1_bypass", base + 0x00, 13); - clk[IMX6QDL_CLK_PLL2_BUS] = imx_clk_gate("pll2_bus", "pll2_bypass", base + 0x30, 13); -@@ -259,7 +370,7 @@ - clk[IMX6QDL_CLK_PLL5_VIDEO_DIV] = clk_register_divider_table(NULL, "pll5_video_div", "pll5_post_div", CLK_SET_RATE_PARENT, base + 0x170, 30, 2, 0, video_div_table, &imx_ccm_lock); - - np = ccm_node; -- base = of_iomap(np, 0); -+ ccm_base = base = of_iomap(np, 0); - WARN_ON(!base); - - imx6q_pm_set_ccm_base(base); -@@ -286,6 +397,8 @@ - clk[IMX6QDL_CLK_IPU2_SEL] = imx_clk_mux("ipu2_sel", base + 0x3c, 14, 2, ipu_sels, ARRAY_SIZE(ipu_sels)); - clk[IMX6QDL_CLK_LDB_DI0_SEL] = imx_clk_mux_flags("ldb_di0_sel", base + 0x2c, 9, 3, ldb_di_sels, ARRAY_SIZE(ldb_di_sels), CLK_SET_RATE_PARENT); - clk[IMX6QDL_CLK_LDB_DI1_SEL] = imx_clk_mux_flags("ldb_di1_sel", base + 0x2c, 12, 3, ldb_di_sels, ARRAY_SIZE(ldb_di_sels), CLK_SET_RATE_PARENT); -+ clk[IMX6QDL_CLK_LDB_DI0_DIV_SEL] = imx_clk_mux_flags("ldb_di0_div_sel", base + 0x20, 10, 1, ldb_di0_div_sels, ARRAY_SIZE(ldb_di0_div_sels), CLK_SET_RATE_PARENT); -+ clk[IMX6QDL_CLK_LDB_DI1_DIV_SEL] = imx_clk_mux_flags("ldb_di1_div_sel", base + 0x20, 11, 1, ldb_di1_div_sels, ARRAY_SIZE(ldb_di1_div_sels), CLK_SET_RATE_PARENT); - clk[IMX6QDL_CLK_IPU1_DI0_PRE_SEL] = imx_clk_mux_flags("ipu1_di0_pre_sel", base + 0x34, 6, 3, ipu_di_pre_sels, ARRAY_SIZE(ipu_di_pre_sels), CLK_SET_RATE_PARENT); - clk[IMX6QDL_CLK_IPU1_DI1_PRE_SEL] = imx_clk_mux_flags("ipu1_di1_pre_sel", base + 0x34, 15, 3, ipu_di_pre_sels, ARRAY_SIZE(ipu_di_pre_sels), CLK_SET_RATE_PARENT); - clk[IMX6QDL_CLK_IPU2_DI0_PRE_SEL] = imx_clk_mux_flags("ipu2_di0_pre_sel", base + 0x38, 6, 3, ipu_di_pre_sels, ARRAY_SIZE(ipu_di_pre_sels), CLK_SET_RATE_PARENT); -@@ -335,9 +448,9 @@ - clk[IMX6QDL_CLK_IPU1_PODF] = imx_clk_divider("ipu1_podf", "ipu1_sel", base + 0x3c, 11, 3); - clk[IMX6QDL_CLK_IPU2_PODF] = imx_clk_divider("ipu2_podf", "ipu2_sel", base + 0x3c, 16, 3); - clk[IMX6QDL_CLK_LDB_DI0_DIV_3_5] = imx_clk_fixed_factor("ldb_di0_div_3_5", "ldb_di0_sel", 2, 7); -- clk[IMX6QDL_CLK_LDB_DI0_PODF] = imx_clk_divider_flags("ldb_di0_podf", 
"ldb_di0_div_3_5", base + 0x20, 10, 1, 0); -+ clk[IMX6QDL_CLK_LDB_DI0_DIV_7] = imx_clk_fixed_factor("ldb_di0_div_7", "ldb_di0_sel", 1, 7); - clk[IMX6QDL_CLK_LDB_DI1_DIV_3_5] = imx_clk_fixed_factor("ldb_di1_div_3_5", "ldb_di1_sel", 2, 7); -- clk[IMX6QDL_CLK_LDB_DI1_PODF] = imx_clk_divider_flags("ldb_di1_podf", "ldb_di1_div_3_5", base + 0x20, 11, 1, 0); -+ clk[IMX6QDL_CLK_LDB_DI1_DIV_7] = imx_clk_fixed_factor("ldb_di1_div_7", "ldb_di1_sel", 1, 7); - clk[IMX6QDL_CLK_IPU1_DI0_PRE] = imx_clk_divider("ipu1_di0_pre", "ipu1_di0_pre_sel", base + 0x34, 3, 3); - clk[IMX6QDL_CLK_IPU1_DI1_PRE] = imx_clk_divider("ipu1_di1_pre", "ipu1_di1_pre_sel", base + 0x34, 12, 3); - clk[IMX6QDL_CLK_IPU2_DI0_PRE] = imx_clk_divider("ipu2_di0_pre", "ipu2_di0_pre_sel", base + 0x38, 3, 3); -@@ -378,6 +491,8 @@ - clk[IMX6QDL_CLK_CAN1_SERIAL] = imx_clk_gate2("can1_serial", "can_root", base + 0x68, 16); - clk[IMX6QDL_CLK_CAN2_IPG] = imx_clk_gate2("can2_ipg", "ipg", base + 0x68, 18); - clk[IMX6QDL_CLK_CAN2_SERIAL] = imx_clk_gate2("can2_serial", "can_root", base + 0x68, 20); -+ clk[IMX6QDL_CLK_DCIC1] = imx_clk_gate2("dcic1", "ipu1_podf", base + 0x68, 24); -+ clk[IMX6QDL_CLK_DCIC2] = imx_clk_gate2("dcic2", "ipu2_podf", base + 0x68, 26); - clk[IMX6QDL_CLK_ECSPI1] = imx_clk_gate2("ecspi1", "ecspi_root", base + 0x6c, 0); - clk[IMX6QDL_CLK_ECSPI2] = imx_clk_gate2("ecspi2", "ecspi_root", base + 0x6c, 2); - clk[IMX6QDL_CLK_ECSPI3] = imx_clk_gate2("ecspi3", "ecspi_root", base + 0x6c, 4); -@@ -414,9 +529,9 @@ - clk[IMX6QDL_CLK_IPU1_DI1] = imx_clk_gate2("ipu1_di1", "ipu1_di1_sel", base + 0x74, 4); - clk[IMX6QDL_CLK_IPU2] = imx_clk_gate2("ipu2", "ipu2_podf", base + 0x74, 6); - clk[IMX6QDL_CLK_IPU2_DI0] = imx_clk_gate2("ipu2_di0", "ipu2_di0_sel", base + 0x74, 8); -- clk[IMX6QDL_CLK_LDB_DI0] = imx_clk_gate2("ldb_di0", "ldb_di0_podf", base + 0x74, 12); -- clk[IMX6QDL_CLK_LDB_DI1] = imx_clk_gate2("ldb_di1", "ldb_di1_podf", base + 0x74, 14); - clk[IMX6QDL_CLK_IPU2_DI1] = imx_clk_gate2("ipu2_di1", "ipu2_di1_sel", base + 0x74, 10); -+ clk[IMX6QDL_CLK_LDB_DI0] = imx_clk_gate2("ldb_di0", "ldb_di0_div_sel", base + 0x74, 12); -+ clk[IMX6QDL_CLK_LDB_DI1] = imx_clk_gate2("ldb_di1", "ldb_di1_div_sel", base + 0x74, 14); - clk[IMX6QDL_CLK_HSI_TX] = imx_clk_gate2_shared("hsi_tx", "hsi_tx_podf", base + 0x74, 16, &share_count_mipi_core_cfg); - clk[IMX6QDL_CLK_MIPI_CORE_CFG] = imx_clk_gate2_shared("mipi_core_cfg", "video_27m", base + 0x74, 16, &share_count_mipi_core_cfg); - clk[IMX6QDL_CLK_MIPI_IPG] = imx_clk_gate2_shared("mipi_ipg", "ipg", base + 0x74, 16, &share_count_mipi_core_cfg); -@@ -446,7 +561,8 @@ - clk[IMX6QDL_CLK_SATA] = imx_clk_gate2("sata", "ahb", base + 0x7c, 4); - clk[IMX6QDL_CLK_SDMA] = imx_clk_gate2("sdma", "ahb", base + 0x7c, 6); - clk[IMX6QDL_CLK_SPBA] = imx_clk_gate2("spba", "ipg", base + 0x7c, 12); -- clk[IMX6QDL_CLK_SPDIF] = imx_clk_gate2("spdif", "spdif_podf", base + 0x7c, 14); -+ clk[IMX6QDL_CLK_SPDIF] = imx_clk_gate2_shared("spdif", "spdif_podf", base + 0x7c, 14, &share_count_spdif); -+ clk[IMX6QDL_CLK_SPDIF_GCLK] = imx_clk_gate2_shared("spdif_gclk", "ipg", base + 0x7c, 14, &share_count_spdif); - clk[IMX6QDL_CLK_SSI1_IPG] = imx_clk_gate2_shared("ssi1_ipg", "ipg", base + 0x7c, 18, &share_count_ssi1); - clk[IMX6QDL_CLK_SSI2_IPG] = imx_clk_gate2_shared("ssi2_ipg", "ipg", base + 0x7c, 20, &share_count_ssi2); - clk[IMX6QDL_CLK_SSI3_IPG] = imx_clk_gate2_shared("ssi3_ipg", "ipg", base + 0x7c, 22, &share_count_ssi3); -@@ -479,54 +595,104 @@ - clk_data.clk_num = ARRAY_SIZE(clk); - of_clk_add_provider(np, of_clk_src_onecell_get, &clk_data); 
- -+ clk_register_clkdev(clk[IMX6QDL_CLK_GPT_3M], "gpt_3m", "imx-gpt.0"); - clk_register_clkdev(clk[IMX6QDL_CLK_ENET_REF], "enet_ref", NULL); - - if ((imx_get_soc_revision() != IMX_CHIP_REVISION_1_0) || - cpu_is_imx6dl()) { -- clk_set_parent(clk[IMX6QDL_CLK_LDB_DI0_SEL], clk[IMX6QDL_CLK_PLL5_VIDEO_DIV]); -- clk_set_parent(clk[IMX6QDL_CLK_LDB_DI1_SEL], clk[IMX6QDL_CLK_PLL5_VIDEO_DIV]); -+ imx_clk_set_parent(clk[IMX6QDL_CLK_LDB_DI0_SEL], clk[IMX6QDL_CLK_PLL5_VIDEO_DIV]); -+ imx_clk_set_parent(clk[IMX6QDL_CLK_LDB_DI1_SEL], clk[IMX6QDL_CLK_PLL5_VIDEO_DIV]); - } - -- clk_set_parent(clk[IMX6QDL_CLK_IPU1_DI0_PRE_SEL], clk[IMX6QDL_CLK_PLL5_VIDEO_DIV]); -- clk_set_parent(clk[IMX6QDL_CLK_IPU1_DI1_PRE_SEL], clk[IMX6QDL_CLK_PLL5_VIDEO_DIV]); -- clk_set_parent(clk[IMX6QDL_CLK_IPU2_DI0_PRE_SEL], clk[IMX6QDL_CLK_PLL5_VIDEO_DIV]); -- clk_set_parent(clk[IMX6QDL_CLK_IPU2_DI1_PRE_SEL], clk[IMX6QDL_CLK_PLL5_VIDEO_DIV]); -- clk_set_parent(clk[IMX6QDL_CLK_IPU1_DI0_SEL], clk[IMX6QDL_CLK_IPU1_DI0_PRE]); -- clk_set_parent(clk[IMX6QDL_CLK_IPU1_DI1_SEL], clk[IMX6QDL_CLK_IPU1_DI1_PRE]); -- clk_set_parent(clk[IMX6QDL_CLK_IPU2_DI0_SEL], clk[IMX6QDL_CLK_IPU2_DI0_PRE]); -- clk_set_parent(clk[IMX6QDL_CLK_IPU2_DI1_SEL], clk[IMX6QDL_CLK_IPU2_DI1_PRE]); -+ init_ldb_clks(clk[IMX6QDL_CLK_PLL2_PFD0_352M]); -+ imx_clk_set_parent(clk[IMX6QDL_CLK_IPU1_DI0_PRE_SEL], clk[IMX6QDL_CLK_PLL5_VIDEO_DIV]); -+ imx_clk_set_parent(clk[IMX6QDL_CLK_IPU1_DI1_PRE_SEL], clk[IMX6QDL_CLK_PLL5_VIDEO_DIV]); -+ imx_clk_set_parent(clk[IMX6QDL_CLK_IPU2_DI0_PRE_SEL], clk[IMX6QDL_CLK_PLL5_VIDEO_DIV]); -+ imx_clk_set_parent(clk[IMX6QDL_CLK_IPU2_DI1_PRE_SEL], clk[IMX6QDL_CLK_PLL5_VIDEO_DIV]); -+ imx_clk_set_parent(clk[IMX6QDL_CLK_IPU1_DI0_SEL], clk[IMX6QDL_CLK_IPU1_DI0_PRE]); -+ imx_clk_set_parent(clk[IMX6QDL_CLK_IPU1_DI1_SEL], clk[IMX6QDL_CLK_IPU1_DI1_PRE]); -+ imx_clk_set_parent(clk[IMX6QDL_CLK_IPU2_DI0_SEL], clk[IMX6QDL_CLK_IPU2_DI0_PRE]); -+ imx_clk_set_parent(clk[IMX6QDL_CLK_IPU2_DI1_SEL], clk[IMX6QDL_CLK_IPU2_DI1_PRE]); -+ -+ if (cpu_is_imx6dl()) -+ imx_clk_set_parent(clk[IMX6QDL_CLK_IPU1_SEL], clk[IMX6QDL_CLK_PLL3_PFD1_540M]); - - /* - * The gpmi needs 100MHz frequency in the EDO/Sync mode, - * We can not get the 100MHz from the pll2_pfd0_352m. - * So choose pll2_pfd2_396m as enfc_sel's parent. - */ -- clk_set_parent(clk[IMX6QDL_CLK_ENFC_SEL], clk[IMX6QDL_CLK_PLL2_PFD2_396M]); -- -- for (i = 0; i < ARRAY_SIZE(clks_init_on); i++) -- clk_prepare_enable(clk[clks_init_on[i]]); -+ imx_clk_set_parent(clk[IMX6QDL_CLK_ENFC_SEL], clk[IMX6QDL_CLK_PLL2_PFD2_396M]); - -+ /* gpu clock initilazation */ -+ /* -+ * On mx6dl, 2d core clock sources(sel, podf) is from 3d -+ * shader core clock, but 3d shader clock multiplexer of -+ * mx6dl is different. For instance the equivalent of -+ * pll2_pfd_594M on mx6q is pll2_pfd_528M on mx6dl. -+ * Make a note here. 
-+ */ -+#if 0 -+ imx_clk_set_parent(clk[IMX6QDL_CLK_GPU3D_SHADER_SEL], clk[IMX6QDL_CLK_PLL2_PFD1_594M]); -+ if (cpu_is_imx6dl()) { -+ imx_clk_set_rate(clk[IMX6QDL_CLK_GPU3D_SHADER], 528000000); -+ /* for mx6dl, change gpu3d_core parent to 594_PFD*/ -+ imx_clk_set_parent(clk[IMX6QDL_CLK_GPU3D_CORE_SEL], clk[IMX6QDL_CLK_PLL2_PFD1_594M]); -+ imx_clk_set_rate(clk[IMX6QDL_CLK_GPU3D_CORE], 528000000); -+ /* for mx6dl, change gpu2d_core parent to 594_PFD*/ -+ imx_clk_set_parent(clk[IMX6QDL_CLK_GPU2D_CORE_SEL], clk[IMX6QDL_CLK_PLL2_PFD1_594M]); -+ imx_clk_set_rate(clk[IMX6QDL_CLK_GPU2D_CORE], 528000000); -+ } else if (cpu_is_imx6q()) { -+ imx_clk_set_rate(clk[IMX6QDL_CLK_GPU3D_SHADER], 594000000); -+ imx_clk_set_parent(clk[IMX6QDL_CLK_GPU3D_CORE_SEL], clk[IMX6QDL_CLK_MMDC_CH0_AXI]); -+ imx_clk_set_rate(clk[IMX6QDL_CLK_GPU3D_CORE], 528000000); -+ imx_clk_set_parent(clk[IMX6QDL_CLK_GPU2D_CORE_SEL], clk[IMX6QDL_CLK_PLL3_USB_OTG]); -+ imx_clk_set_rate(clk[IMX6QDL_CLK_GPU2D_CORE], 480000000); -+ } -+#endif - if (IS_ENABLED(CONFIG_USB_MXS_PHY)) { -- clk_prepare_enable(clk[IMX6QDL_CLK_USBPHY1_GATE]); -- clk_prepare_enable(clk[IMX6QDL_CLK_USBPHY2_GATE]); -+ imx_clk_prepare_enable(clk[IMX6QDL_CLK_USBPHY1_GATE]); -+ imx_clk_prepare_enable(clk[IMX6QDL_CLK_USBPHY2_GATE]); - } - - /* - * Let's initially set up CLKO with OSC24M, since this configuration - * is widely used by imx6q board designs to clock audio codec. - */ -- ret = clk_set_parent(clk[IMX6QDL_CLK_CKO2_SEL], clk[IMX6QDL_CLK_OSC]); -+ ret = imx_clk_set_parent(clk[IMX6QDL_CLK_CKO2_SEL], clk[IMX6QDL_CLK_OSC]); - if (!ret) -- ret = clk_set_parent(clk[IMX6QDL_CLK_CKO], clk[IMX6QDL_CLK_CKO2]); -+ ret = imx_clk_set_parent(clk[IMX6QDL_CLK_CKO], clk[IMX6QDL_CLK_CKO2]); - if (ret) - pr_warn("failed to set up CLKO: %d\n", ret); - - /* Audio-related clocks configuration */ -- clk_set_parent(clk[IMX6QDL_CLK_SPDIF_SEL], clk[IMX6QDL_CLK_PLL3_PFD3_454M]); -+ imx_clk_set_parent(clk[IMX6QDL_CLK_SPDIF_SEL], clk[IMX6QDL_CLK_PLL3_PFD3_454M]); - - /* All existing boards with PCIe use LVDS1 */ - if (IS_ENABLED(CONFIG_PCI_IMX6)) -- clk_set_parent(clk[IMX6QDL_CLK_LVDS1_SEL], clk[IMX6QDL_CLK_SATA_REF_100M]); -+ imx_clk_set_parent(clk[IMX6QDL_CLK_LVDS1_SEL], clk[IMX6QDL_CLK_SATA_REF_100M]); -+ -+ /* -+ * Enable clocks only after both parent and rate are all initialized -+ * as needed -+ */ -+ for (i = 0; i < ARRAY_SIZE(clks_init_on); i++) -+ imx_clk_prepare_enable(clk[clks_init_on[i]]); -+ -+ /* -+ * If VPU 352M is enabled, then PLL2_PDF2 need to be -+ * set to 352M, cpufreq will be disabled as VDDSOC/PU -+ * need to be at highest voltage, scaling cpu freq is -+ * not saving any power, and busfreq will be also disabled -+ * as the PLL2_PFD2 is not at default freq, in a word, -+ * all modules that sourceing clk from PLL2_PFD2 will -+ * be impacted. 
-+ */ -+ if (vpu352) { -+ clk_set_rate(clk[IMX6QDL_CLK_PLL2_PFD2_396M], 352000000); -+ clk_set_parent(clk[IMX6QDL_CLK_VPU_AXI_SEL], clk[IMX6QDL_CLK_PLL2_PFD2_396M]); -+ pr_info("VPU 352M is enabled!\n"); -+ } - - /* Set initial power mode */ - imx6q_set_lpm(WAIT_CLOCKED); -diff -Nur linux-4.1.3/arch/arm/mach-imx/clk-pllv3.c linux-xbian-imx6/arch/arm/mach-imx/clk-pllv3.c ---- linux-4.1.3/arch/arm/mach-imx/clk-pllv3.c 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/arch/arm/mach-imx/clk-pllv3.c 2015-07-27 23:13:01.085110746 +0200 -@@ -23,6 +23,7 @@ - #define PLL_DENOM_OFFSET 0x20 - - #define BM_PLL_POWER (0x1 << 12) -+#define BM_PLL_BYPASS (0x1 << 16) - #define BM_PLL_LOCK (0x1 << 31) - - /** -@@ -237,9 +238,10 @@ - struct clk_pllv3 *pll = to_clk_pllv3(hw); - unsigned long min_rate = parent_rate * 27; - unsigned long max_rate = parent_rate * 54; -- u32 val, div; -+ u32 val, newval, div; - u32 mfn, mfd = 1000000; - s64 temp64; -+ int ret; - - if (rate < min_rate || rate > max_rate) - return -EINVAL; -@@ -251,13 +253,27 @@ - mfn = temp64; - - val = readl_relaxed(pll->base); -- val &= ~pll->div_mask; -- val |= div; -- writel_relaxed(val, pll->base); -+ -+ /* set the PLL into bypass mode */ -+ newval = val | BM_PLL_BYPASS; -+ writel_relaxed(newval, pll->base); -+ -+ /* configure the new frequency */ -+ newval &= ~pll->div_mask; -+ newval |= div; -+ writel_relaxed(newval, pll->base); - writel_relaxed(mfn, pll->base + PLL_NUM_OFFSET); - writel_relaxed(mfd, pll->base + PLL_DENOM_OFFSET); - -- return clk_pllv3_wait_lock(pll); -+ ret = clk_pllv3_wait_lock(pll); -+ if (ret == 0 && val & BM_PLL_POWER) { -+ /* only if it locked can we switch back to the PLL */ -+ newval &= ~BM_PLL_BYPASS; -+ newval |= val & BM_PLL_BYPASS; -+ writel_relaxed(newval, pll->base); -+ } -+ -+ return ret; - } - - static const struct clk_ops clk_pllv3_av_ops = { -diff -Nur linux-4.1.3/arch/arm/mach-imx/common.h linux-xbian-imx6/arch/arm/mach-imx/common.h ---- linux-4.1.3/arch/arm/mach-imx/common.h 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/arch/arm/mach-imx/common.h 2015-07-27 23:13:01.085110746 +0200 -@@ -56,6 +56,7 @@ - void mxc_set_cpu_type(unsigned int type); - void mxc_restart(enum reboot_mode, const char *); - void mxc_arch_reset_init(void __iomem *); -+void mxc_arch_reset_init_dt(void); - int mx51_revision(void); - int mx53_revision(void); - void imx_set_aips(void __iomem *); -@@ -86,6 +87,8 @@ - MX3_SLEEP, - }; - -+extern int vpu352; -+ - void mx3_cpu_lp_set(enum mx3_cpu_pwr_mode mode); - void imx_print_silicon_rev(const char *cpu, int srev); - -@@ -102,6 +105,7 @@ - static inline void imx_smp_prepare(void) {} - #endif - void imx_src_init(void); -+ - void imx_gpc_pre_suspend(bool arm_power_off); - void imx_gpc_post_resume(void); - void imx_gpc_mask_all(void); -diff -Nur linux-4.1.3/arch/arm/mach-imx/ddr3_freq_imx6.S linux-xbian-imx6/arch/arm/mach-imx/ddr3_freq_imx6.S ---- linux-4.1.3/arch/arm/mach-imx/ddr3_freq_imx6.S 1970-01-01 01:00:00.000000000 +0100 -+++ linux-xbian-imx6/arch/arm/mach-imx/ddr3_freq_imx6.S 2015-07-27 23:13:01.089096525 +0200 -@@ -0,0 +1,893 @@ -+/* -+ * Copyright (C) 2011-2013 Freescale Semiconductor, Inc. All Rights Reserved. -+ * -+ * This program is free software; you can redistribute it and/or modify -+ * it under the terms of the GNU General Public License as published by -+ * the Free Software Foundation; either version 2 of the License, or -+ * (at your option) any later version. 
-+ -+ * This program is distributed in the hope that it will be useful, -+ * but WITHOUT ANY WARRANTY; without even the implied warranty of -+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the -+ * GNU General Public License for more details. -+ -+ * You should have received a copy of the GNU General Public License along -+ * with this program; if not, write to the Free Software Foundation, Inc., -+ * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. -+ */ -+ -+#include -+ -+#define MMDC0_MDPDC 0x4 -+#define MMDC0_MDCF0 0x0c -+#define MMDC0_MDCF1 0x10 -+#define MMDC0_MDMISC 0x18 -+#define MMDC0_MDSCR 0x1c -+#define MMDC0_MAPSR 0x404 -+#define MMDC0_MADPCR0 0x410 -+#define MMDC0_MPZQHWCTRL 0x800 -+#define MMDC1_MPZQHWCTRL 0x4800 -+#define MMDC0_MPODTCTRL 0x818 -+#define MMDC1_MPODTCTRL 0x4818 -+#define MMDC0_MPDGCTRL0 0x83c -+#define MMDC1_MPDGCTRL0 0x483c -+#define MMDC0_MPMUR0 0x8b8 -+#define MMDC1_MPMUR0 0x48b8 -+ -+#define CCM_CBCDR 0x14 -+#define CCM_CBCMR 0x18 -+#define CCM_CSCMR1 0x1c -+#define CCM_CDHIPR 0x48 -+ -+#define L2_CACHE_SYNC 0x730 -+ -+ .align 3 -+ -+ .macro switch_to_528MHz -+ -+ /* check if periph_clk_sel is already set */ -+ ldr r0, [r6, #CCM_CBCDR] -+ and r0, r0, #(1 << 25) -+ cmp r0, #(1 << 25) -+ beq set_ahb_podf_before_switch -+ -+ /* change periph_clk to be sourced from pll3_clk. */ -+ ldr r0, [r6, #CCM_CBCMR] -+ bic r0, r0, #(3 << 12) -+ str r0, [r6, #CCM_CBCMR] -+ -+ ldr r0, [r6, #CCM_CBCDR] -+ bic r0, r0, #(0x38 << 20) -+ str r0, [r6, #CCM_CBCDR] -+ -+ /* -+ * set the AHB dividers before the switch, -+ * don't change AXI clock divider, -+ * set the MMDC_DIV=1, AXI_DIV = 2, AHB_DIV=4, -+ */ -+ ldr r0, [r6, #CCM_CBCDR] -+ ldr r2, =0x3f1f00 -+ bic r0, r0, r2 -+ orr r0, r0, #0xd00 -+ orr r0, r0, #(1 << 16) -+ str r0, [r6, #CCM_CBCDR] -+ -+wait_div_update528: -+ ldr r0, [r6, #CCM_CDHIPR] -+ cmp r0, #0 -+ bne wait_div_update528 -+ -+ /* now switch periph_clk to pll3_main_clk. */ -+ ldr r0, [r6, #CCM_CBCDR] -+ orr r0, r0, #(1 << 25) -+ str r0, [r6, #CCM_CBCDR] -+ -+periph_clk_switch3: -+ ldr r0, [r6, #CCM_CDHIPR] -+ cmp r0, #0 -+ bne periph_clk_switch3 -+ -+ b switch_pre_periph_clk_528 -+ -+set_ahb_podf_before_switch: -+ /* -+ * set the MMDC_DIV=1, AXI_DIV = 2, AHB_DIV=4, -+ */ -+ ldr r0, [r6, #CCM_CBCDR] -+ ldr r2, =0x3f1f00 -+ bic r0, r0, r2 -+ orr r0, r0, #0xd00 -+ orr r0, r0, #(1 << 16) -+ str r0, [r6, #CCM_CBCDR] -+ -+wait_div_update528_1: -+ ldr r0, [r6, #CCM_CDHIPR] -+ cmp r0, #0 -+ bne wait_div_update528_1 -+ -+switch_pre_periph_clk_528: -+ -+ /* now switch pre_periph_clk to PLL2_528MHz. */ -+ ldr r0, [r6, #CCM_CBCMR] -+ bic r0, r0, #(0xc << 16) -+ str r0, [r6, #CCM_CBCMR] -+ -+ /* now switch periph_clk back. */ -+ ldr r0, [r6, #CCM_CBCDR] -+ bic r0, r0, #(1 << 25) -+ str r0, [r6, #CCM_CBCDR] -+ -+periph_clk_switch4: -+ ldr r0, [r6, #CCM_CDHIPR] -+ cmp r0, #0 -+ bne periph_clk_switch4 -+ -+ .endm -+ -+ .macro switch_to_400MHz -+ -+ /* check if periph_clk_sel is already set. */ -+ ldr r0, [r6, #CCM_CBCDR] -+ and r0, r0, #(1 << 25) -+ cmp r0, #(1 << 25) -+ beq set_ahb_podf_before_switch1 -+ -+ /* change periph_clk to be sourced from pll3_clk. */ -+ ldr r0, [r6, #CCM_CBCMR] -+ bic r0, r0, #(3 << 12) -+ str r0, [r6, #CCM_CBCMR] -+ -+ ldr r0, [r6, #CCM_CBCDR] -+ bic r0, r0, #(0x38 << 24) -+ str r0, [r6, #CCM_CBCDR] -+ -+ /* now switch periph_clk to pll3_main_clk. 
*/ -+ ldr r0, [r6, #CCM_CBCDR] -+ orr r0, r0, #(1 << 25) -+ str r0, [r6, #CCM_CBCDR] -+ -+periph_clk_switch5: -+ ldr r0, [r6, #CCM_CDHIPR] -+ cmp r0, #0 -+ bne periph_clk_switch5 -+ -+ b switch_pre_periph_clk_400 -+ -+set_ahb_podf_before_switch1: -+ /* -+ * set the MMDC_DIV=1, AXI_DIV = 2, AHB_DIV=4, -+ */ -+ ldr r0, [r6, #CCM_CBCDR] -+ ldr r2, =0x3f1f00 -+ bic r0, r0, r2 -+ orr r0, r0, #(0x9 << 8) -+ orr r0, r0, #(1 << 16) -+ str r0, [r6, #CCM_CBCDR] -+ -+wait_div_update400_1: -+ ldr r0, [r6, #CCM_CDHIPR] -+ cmp r0, #0 -+ bne wait_div_update400_1 -+ -+switch_pre_periph_clk_400: -+ -+ /* now switch pre_periph_clk to PFD_400MHz. */ -+ ldr r0, [r6, #CCM_CBCMR] -+ bic r0, r0, #(0xc << 16) -+ orr r0, r0, #(0x4 << 16) -+ str r0, [r6, #CCM_CBCMR] -+ -+ /* now switch periph_clk back. */ -+ ldr r0, [r6, #CCM_CBCDR] -+ bic r0, r0, #(1 << 25) -+ str r0, [r6, #CCM_CBCDR] -+ -+periph_clk_switch6: -+ ldr r0, [r6, #CCM_CDHIPR] -+ cmp r0, #0 -+ bne periph_clk_switch6 -+ -+ /* -+ * change AHB divider so that we are at 400/3=133MHz. -+ * don't change AXI clock divider. -+ * set the MMDC_DIV=1, AXI_DIV=2, AHB_DIV=3, -+ */ -+ ldr r0, [r6, #CCM_CBCDR] -+ ldr r2, =0x3f1f00 -+ bic r0, r0, r2 -+ orr r0, r0, #(0x9 << 8) -+ orr r0, r0, #(1 << 16) -+ str r0, [r6, #CCM_CBCDR] -+ -+wait_div_update400_2: -+ ldr r0, [r6, #CCM_CDHIPR] -+ cmp r0, #0 -+ bne wait_div_update400_2 -+ -+ .endm -+ -+ .macro switch_to_50MHz -+ -+ /* check if periph_clk_sel is already set. */ -+ ldr r0, [r6, #CCM_CBCDR] -+ and r0, r0, #(1 << 25) -+ cmp r0, #(1 << 25) -+ beq switch_pre_periph_clk_50 -+ -+ /* -+ * set the periph_clk to be sourced from PLL2_PFD_200M -+ * change periph_clk to be sourced from pll3_clk. -+ * ensure PLL3 is the source and set the divider to 1. -+ */ -+ ldr r0, [r6, #CCM_CBCMR] -+ bic r0, r0, #(0x3 << 12) -+ str r0, [r6, #CCM_CBCMR] -+ -+ ldr r0, [r6, #CCM_CBCDR] -+ bic r0, r0, #(0x38 << 24) -+ str r0, [r6, #CCM_CBCDR] -+ -+ /* now switch periph_clk to pll3_main_clk. */ -+ ldr r0, [r6, #CCM_CBCDR] -+ orr r0, r0, #(1 << 25) -+ str r0, [r6, #CCM_CBCDR] -+ -+periph_clk_switch_50: -+ ldr r0, [r6, #CCM_CDHIPR] -+ cmp r0, #0 -+ bne periph_clk_switch_50 -+ -+switch_pre_periph_clk_50: -+ -+ /* now switch pre_periph_clk to PFD_200MHz. */ -+ ldr r0, [r6, #CCM_CBCMR] -+ orr r0, r0, #(0xc << 16) -+ str r0, [r6, #CCM_CBCMR] -+ -+ /* -+ * set the MMDC_DIV=4, AXI_DIV = 4, AHB_DIV=8, -+ */ -+ ldr r0, [r6, #CCM_CBCDR] -+ ldr r2, =0x3f1f00 -+ bic r0, r0, r2 -+ orr r0, r0, #(0x18 << 16) -+ orr r0, r0, #(0x3 << 16) -+ -+ /* -+ * if changing AHB divider remember to change -+ * the IPGPER divider too below. -+ */ -+ orr r0, r0, #0x1d00 -+ str r0, [r6, #CCM_CBCDR] -+ -+wait_div_update_50: -+ ldr r0, [r6, #CCM_CDHIPR] -+ cmp r0, #0 -+ bne wait_div_update_50 -+ -+ /* now switch periph_clk back. */ -+ ldr r0, [r6, #CCM_CBCDR] -+ bic r0, r0, #(1 << 25) -+ str r0, [r6, #CCM_CBCDR] -+ -+periph_clk_switch2: -+ ldr r0, [r6, #CCM_CDHIPR] -+ cmp r0, #0 -+ bne periph_clk_switch2 -+ -+ .endm -+ -+ .macro switch_to_24MHz -+ /* -+ * change the freq now try setting DDR to 24MHz. -+ * source it from the periph_clk2 ensure the -+ * periph_clk2 is sourced from 24MHz and the -+ * divider is 1. -+ */ -+ -+ ldr r0, [r6, #CCM_CBCMR] -+ bic r0, r0, #(0x3 << 12) -+ orr r0, r0, #(1 << 12) -+ str r0, [r6, #CCM_CBCMR] -+ -+ ldr r0, [r6, #CCM_CBCDR] -+ bic r0, r0, #(0x38 << 24) -+ str r0, [r6, #CCM_CBCDR] -+ -+ /* now switch periph_clk to 24MHz. 
*/ -+ ldr r0, [r6, #CCM_CBCDR] -+ orr r0, r0, #(1 << 25) -+ str r0, [r6, #CCM_CBCDR] -+ -+periph_clk_switch1: -+ ldr r0, [r6, #CCM_CDHIPR] -+ cmp r0, #0 -+ bne periph_clk_switch1 -+ -+ /* change all the dividers to 1. */ -+ ldr r0, [r6, #CCM_CBCDR] -+ ldr r2, =0x3f1f00 -+ bic r0, r0, r2 -+ orr r0, r0, #(1 << 8) -+ str r0, [r6, #CCM_CBCDR] -+ -+ /* Wait for the divider to change. */ -+wait_div_update: -+ ldr r0, [r6, #CCM_CDHIPR] -+ cmp r0, #0 -+ bne wait_div_update -+ -+ .endm -+ -+/* -+ * mx6_ddr3_freq_change -+ * -+ * idle the processor (eg, wait for interrupt). -+ * make sure DDR is in self-refresh. -+ * IRQs are already disabled. -+ */ -+ENTRY(mx6_ddr3_freq_change) -+ -+ stmfd sp!, {r4-r12} -+ -+ /* -+ * r5 -> mmdc_base -+ * r6 -> ccm_base -+ * r7 -> iomux_base -+ * r12 -> l2_base -+ */ -+ mov r4, r0 -+ mov r8, r1 -+ mov r9, r2 -+ mov r11, r3 -+ -+ /* -+ * Get the addresses of the registers. -+ * They are last few entries in the -+ * ddr_settings parameter. -+ * The first entry contains the count, -+ * and each entry is 2 words. -+ */ -+ ldr r0, [r1] -+ add r0, r0, #1 -+ lsl r0, r0, #3 -+ add r1, r0, r1 -+ /* mmdc_base. */ -+ ldr r5, [r1] -+ add r1, #8 -+ /* ccm_base */ -+ ldr r6, [r1] -+ add r1, #8 -+ /*iomux_base */ -+ ldr r7, [r1] -+ add r1, #8 -+ /*l2_base */ -+ ldr r12, [r1] -+ -+ddr_freq_change: -+ /* -+ * make sure no TLB miss will occur when -+ * the DDR is in self refresh. invalidate -+ * TLB single entry to ensure that the -+ * address is not already in the TLB. -+ */ -+ -+ adr r10, ddr_freq_change -+ -+ ldr r2, [r6] -+ ldr r2, [r5] -+ ldr r2, [r7] -+ ldr r2, [r8] -+ ldr r2, [r10] -+ ldr r2, [r11] -+ ldr r2, [r12] -+ -+#ifdef CONFIG_CACHE_L2X0 -+ /* -+ * Make sure the L2 buffers are drained. -+ * Sync operation on L2 drains the buffers. -+ */ -+ mov r1, #0x0 -+ str r1, [r12, #L2_CACHE_SYNC] -+#endif -+ -+ /* disable automatic power saving. */ -+ ldr r0, [r5, #MMDC0_MAPSR] -+ orr r0, r0, #0x01 -+ str r0, [r5, #MMDC0_MAPSR] -+ -+ /* disable MMDC power down timer. */ -+ ldr r0, [r5, #MMDC0_MDPDC] -+ bic r0, r0, #(0xff << 8) -+ str r0, [r5, #MMDC0_MDPDC] -+ -+ /* delay for a while */ -+ ldr r1, =4 -+delay1: -+ ldr r2, =0 -+cont1: -+ ldr r0, [r5, r2] -+ add r2, r2, #4 -+ cmp r2, #16 -+ bne cont1 -+ sub r1, r1, #1 -+ cmp r1, #0 -+ bgt delay1 -+ -+ /* set CON_REG */ -+ ldr r0, =0x8000 -+ str r0, [r5, #MMDC0_MDSCR] -+poll_conreq_set_1: -+ ldr r0, [r5, #MMDC0_MDSCR] -+ and r0, r0, #(0x4 << 12) -+ cmp r0, #(0x4 << 12) -+ bne poll_conreq_set_1 -+ -+ ldr r0, =0x00008050 -+ str r0, [r5, #MMDC0_MDSCR] -+ ldr r0, =0x00008058 -+ str r0, [r5, #MMDC0_MDSCR] -+ -+ /* -+ * if requested frequency is greater than -+ * 300MHz go to DLL on mode. -+ */ -+ ldr r1, =300000000 -+ cmp r4, r1 -+ bge dll_on_mode -+ -+dll_off_mode: -+ -+ /* if DLL is currently on, turn it off. 
*/ -+ cmp r9, #1 -+ beq continue_dll_off_1 -+ -+ ldr r0, =0x00018031 -+ str r0, [r5, #MMDC0_MDSCR] -+ -+ ldr r0, =0x00018039 -+ str r0, [r5, #MMDC0_MDSCR] -+ -+ ldr r1, =10 -+delay1a: -+ ldr r2, =0 -+cont1a: -+ ldr r0, [r5, r2] -+ add r2, r2, #4 -+ cmp r2, #16 -+ bne cont1a -+ sub r1, r1, #1 -+ cmp r1, #0 -+ bgt delay1a -+ -+continue_dll_off_1: -+ /* set DVFS - enter self refresh mode */ -+ ldr r0, [r5, #MMDC0_MAPSR] -+ orr r0, r0, #(1 << 21) -+ str r0, [r5, #MMDC0_MAPSR] -+ -+ /* de-assert con_req */ -+ mov r0, #0x0 -+ str r0, [r5, #MMDC0_MDSCR] -+ -+poll_dvfs_set_1: -+ ldr r0, [r5, #MMDC0_MAPSR] -+ and r0, r0, #(1 << 25) -+ cmp r0, #(1 << 25) -+ bne poll_dvfs_set_1 -+ -+ ldr r1, =24000000 -+ cmp r4, r1 -+ beq switch_freq_24 -+ -+ switch_to_50MHz -+ b continue_dll_off_2 -+ -+switch_freq_24: -+ switch_to_24MHz -+ -+continue_dll_off_2: -+ -+ /* set SBS - block ddr accesses */ -+ ldr r0, [r5, #MMDC0_MADPCR0] -+ orr r0, r0, #(1 << 8) -+ str r0, [r5, #MMDC0_MADPCR0] -+ -+ /* clear DVFS - exit from self refresh mode */ -+ ldr r0, [r5, #MMDC0_MAPSR] -+ bic r0, r0, #(1 << 21) -+ str r0, [r5, #MMDC0_MAPSR] -+ -+poll_dvfs_clear_1: -+ ldr r0, [r5, #MMDC0_MAPSR] -+ and r0, r0, #(1 << 25) -+ cmp r0, #(1 << 25) -+ beq poll_dvfs_clear_1 -+ -+ /* if DLL was previously on, continue DLL off routine. */ -+ cmp r9, #1 -+ beq continue_dll_off_3 -+ -+ ldr r0, =0x00018031 -+ str r0, [r5, #MMDC0_MDSCR] -+ -+ ldr r0, =0x00018039 -+ str r0, [r5, #MMDC0_MDSCR] -+ -+ ldr r0, =0x08208030 -+ str r0, [r5, #MMDC0_MDSCR] -+ -+ ldr r0, =0x08208038 -+ str r0, [r5, #MMDC0_MDSCR] -+ -+ ldr r0, =0x00088032 -+ str r0, [r5, #MMDC0_MDSCR] -+ -+ ldr r0, =0x0008803A -+ str r0, [r5, #MMDC0_MDSCR] -+ -+ /* delay for a while. */ -+ ldr r1, =4 -+delay_1: -+ ldr r2, =0 -+cont_1: -+ ldr r0, [r5, r2] -+ add r2, r2, #4 -+ cmp r2, #16 -+ bne cont_1 -+ sub r1, r1, #1 -+ cmp r1, #0 -+ bgt delay_1 -+ -+ ldr r0, [r5, #MMDC0_MDCF0] -+ bic r0, r0, #0xf -+ orr r0, r0, #0x3 -+ str r0, [r5, #MMDC0_MDCF0] -+ -+ ldr r0, [r5, #MMDC0_MDCF1] -+ bic r0, r0, #0x7 -+ orr r0, r0, #0x4 -+ str r0, [r5, #MMDC0_MDCF1] -+ -+ ldr r0, =0x00011680 -+ str r0, [r5, #MMDC0_MDMISC] -+ -+ /* enable dqs pull down in the IOMUX. */ -+ ldr r1, [r11] -+ add r11, r11, #8 -+ ldr r2, =0x3028 -+update_iomux: -+ ldr r0, [r11, #0x0] -+ ldr r3, [r7, r0] -+ bic r3, r3, r2 -+ orr r3, r3, #(0x3 << 12) -+ orr r3, r3, #0x28 -+ str r3, [r7, r0] -+ add r11, r11, #8 -+ sub r1, r1, #1 -+ cmp r1, #0 -+ bgt update_iomux -+ -+ /* ODT disabled. */ -+ ldr r0, =0x0 -+ ldr r2, =MMDC0_MPODTCTRL -+ str r0, [r5, r2] -+ ldr r2, =MMDC1_MPODTCTRL -+ str r0, [r5, r2] -+ -+ /* DQS gating disabled. */ -+ ldr r2, =MMDC0_MPDGCTRL0 -+ ldr r0, [r5, r2] -+ orr r0, r0, #(1 << 29) -+ str r0, [r5, r2] -+ -+ ldr r2, =MMDC1_MPDGCTRL0 -+ ldr r0, [r5, r2] -+ orr r0, r0, #(0x1 << 29) -+ str r0, [r5, r2] -+ -+ /* MMDC0_MAPSR adopt power down enable. */ -+ ldr r0, [r5, #MMDC0_MAPSR] -+ bic r0, r0, #0x01 -+ str r0, [r5, #MMDC0_MAPSR] -+ -+ /* frc_msr + mu bypass */ -+ ldr r0, =0x00000060 -+ str r0, [r5, #MMDC0_MPMUR0] -+ ldr r2, =MMDC1_MPMUR0 -+ str r0, [r5, r2] -+ ldr r0, =0x00000460 -+ str r0, [r5, #MMDC0_MPMUR0] -+ ldr r2, =MMDC1_MPMUR0 -+ str r0, [r5, r2] -+ ldr r0, =0x00000c60 -+ str r0, [r5, #MMDC0_MPMUR0] -+ ldr r2, =MMDC1_MPMUR0 -+ str r0, [r5, r2] -+ -+continue_dll_off_3: -+ /* clear SBS - unblock accesses to DDR. 
*/ -+ ldr r0, [r5, #MMDC0_MADPCR0] -+ bic r0, r0, #(0x1 << 8) -+ str r0, [r5, #MMDC0_MADPCR0] -+ -+ mov r0, #0x0 -+ str r0, [r5, #MMDC0_MDSCR] -+poll_conreq_clear_1: -+ ldr r0, [r5, #MMDC0_MDSCR] -+ and r0, r0, #(0x4 << 12) -+ cmp r0, #(0x4 << 12) -+ beq poll_conreq_clear_1 -+ -+ b done -+ -+dll_on_mode: -+ /* assert DVFS - enter self refresh mode. */ -+ ldr r0, [r5, #MMDC0_MAPSR] -+ orr r0, r0, #(1 << 21) -+ str r0, [r5, #MMDC0_MAPSR] -+ -+ /* de-assert CON_REQ. */ -+ mov r0, #0x0 -+ str r0, [r5, #MMDC0_MDSCR] -+ -+ /* poll DVFS ack. */ -+poll_dvfs_set_2: -+ ldr r0, [r5, #MMDC0_MAPSR] -+ and r0, r0, #(1 << 25) -+ cmp r0, #(1 << 25) -+ bne poll_dvfs_set_2 -+ -+ ldr r1, =528000000 -+ cmp r4, r1 -+ beq switch_freq_528 -+ -+ switch_to_400MHz -+ -+ b continue_dll_on -+ -+switch_freq_528: -+ switch_to_528MHz -+ -+continue_dll_on: -+ -+ /* set SBS step-by-step mode. */ -+ ldr r0, [r5, #MMDC0_MADPCR0] -+ orr r0, r0, #( 1 << 8) -+ str r0, [r5, #MMDC0_MADPCR0] -+ -+ /* clear DVFS - exit self refresh mode. */ -+ ldr r0, [r5, #MMDC0_MAPSR] -+ bic r0, r0, #(1 << 21) -+ str r0, [r5, #MMDC0_MAPSR] -+ -+poll_dvfs_clear_2: -+ ldr r0, [r5, #MMDC0_MAPSR] -+ and r0, r0, #(1 << 25) -+ cmp r0, #(1 << 25) -+ beq poll_dvfs_clear_2 -+ -+ /* if DLL is currently off, turn it back on. */ -+ cmp r9, #0 -+ beq update_calibration_only -+ -+ ldr r0, =0xa5390003 -+ str r0, [r5, #MMDC0_MPZQHWCTRL] -+ ldr r2, =MMDC1_MPZQHWCTRL -+ str r0, [r5, r2] -+ -+ /* enable DQS gating. */ -+ ldr r2, =MMDC0_MPDGCTRL0 -+ ldr r0, [r5, r2] -+ bic r0, r0, #(1 << 29) -+ str r0, [r5, r2] -+ -+ ldr r2, =MMDC1_MPDGCTRL0 -+ ldr r0, [r5, r2] -+ bic r0, r0, #(1 << 29) -+ str r0, [r5, r2] -+ -+ /* force measure. */ -+ ldr r0, =0x00000800 -+ str r0, [r5, #MMDC0_MPMUR0] -+ ldr r2, =MMDC1_MPMUR0 -+ str r0, [r5, r2] -+ -+ /* delay for while. */ -+ ldr r1, =4 -+delay5: -+ ldr r2, =0 -+cont5: -+ ldr r0, [r5, r2] -+ add r2, r2, #4 -+ cmp r2, #16 -+ bne cont5 -+ sub r1, r1, #1 -+ cmp r1, #0 -+ bgt delay5 -+ -+ /* disable dqs pull down in the IOMUX. */ -+ ldr r1, [r11] -+ add r11, r11, #8 -+update_iomux1: -+ ldr r0, [r11, #0x0] -+ ldr r3, [r11, #0x4] -+ str r3, [r7, r0] -+ add r11, r11, #8 -+ sub r1, r1, #1 -+ cmp r1, #0 -+ bgt update_iomux1 -+ -+ /* config MMDC timings to 528MHz. */ -+ ldr r9, [r8] -+ add r8, r8, #8 -+ ldr r0, [r8, #0x0] -+ ldr r3, [r8, #0x4] -+ str r3, [r5, r0] -+ add r8, r8, #8 -+ -+ ldr r0, [r8, #0x0] -+ ldr r3, [r8, #0x4] -+ str r3, [r5, r0] -+ add r8, r8, #8 -+ -+ /* update MISC register: WALAT, RALAT */ -+ ldr r0, =0x00001740 -+ str r0, [r5, #MMDC0_MDMISC] -+ -+ /* configure ddr devices to dll on, odt. */ -+ ldr r0, =0x00048031 -+ str r0, [r5, #MMDC0_MDSCR] -+ -+ ldr r0, =0x00048039 -+ str r0, [r5, #MMDC0_MDSCR] -+ -+ /* delay for while. */ -+ ldr r1, =4 -+delay7: -+ ldr r2, =0 -+cont7: -+ ldr r0, [r5, r2] -+ add r2, r2, #4 -+ cmp r2, #16 -+ bne cont7 -+ sub r1, r1, #1 -+ cmp r1, #0 -+ bgt delay7 -+ -+ /* reset dll. */ -+ ldr r0, =0x09408030 -+ str r0, [r5, #MMDC0_MDSCR] -+ -+ ldr r0, =0x09408038 -+ str r0, [r5, #MMDC0_MDSCR] -+ -+ /* delay for while. 
*/ -+ ldr r1, =100 -+delay8: -+ ldr r2, =0 -+cont8: -+ ldr r0, [r5, r2] -+ add r2, r2, #4 -+ cmp r2, #16 -+ bne cont8 -+ sub r1, r1, #1 -+ cmp r1, #0 -+ bgt delay8 -+ -+ ldr r0, [r8, #0x0] -+ ldr r3, [r8, #0x4] -+ str r3, [r5, r0] -+ add r8, r8, #8 -+ -+ ldr r0, [r8, #0x0] -+ ldr r3, [r8, #0x4] -+ str r3, [r5, r0] -+ add r8, r8, #8 -+ -+ ldr r0, =0x00428031 -+ str r0, [r5, #MMDC0_MDSCR] -+ -+ ldr r0, =0x00428039 -+ str r0, [r5, #MMDC0_MDSCR] -+ -+ ldr r0, [r8, #0x0] -+ ldr r3, [r8, #0x4] -+ str r3, [r5, r0] -+ add r8, r8, #8 -+ -+ ldr r0, [r8, #0x0] -+ ldr r3, [r8, #0x4] -+ str r3, [r5, r0] -+ add r8, r8, #8 -+ -+ /* issue a zq command. */ -+ ldr r0, =0x04008040 -+ str r0, [r5, #MMDC0_MDSCR] -+ -+ ldr r0, =0x04008048 -+ str r0, [r5, #MMDC0_MDSCR] -+ -+ /* MMDC ODT enable. */ -+ ldr r0, [r8, #0x0] -+ ldr r3, [r8, #0x4] -+ str r3, [r5, r0] -+ add r8, r8, #8 -+ -+ ldr r2, =0x4818 -+ str r3, [r5, r2] -+ -+ /* delay for while. */ -+ ldr r1, =40 -+delay15: -+ ldr r2, =0 -+cont15: -+ ldr r0, [r5, r2] -+ add r2, r2, #4 -+ cmp r2, #16 -+ bne cont15 -+ sub r1, r1, #1 -+ cmp r1, #0 -+ bgt delay15 -+ -+ /* MMDC0_MAPSR adopt power down enable. */ -+ ldr r0, [r5, #MMDC0_MAPSR] -+ bic r0, r0, #0x01 -+ str r0, [r5, #MMDC0_MAPSR] -+ -+ /* enable MMDC power down timer. */ -+ ldr r0, [r5, #MMDC0_MDPDC] -+ orr r0, r0, #(0x55 << 8) -+ str r0, [r5, #MMDC0_MDPDC] -+ -+ b update_calibration -+ -+update_calibration_only: -+ ldr r1, [r8] -+ sub r1, r1, #7 -+ add r8, r8, #64 -+ b update_calib -+ -+update_calibration: -+ /* write the new calibration values. */ -+ mov r1, r9 -+ sub r1, r1, #7 -+ -+update_calib: -+ ldr r0, [r8, #0x0] -+ ldr r3, [r8, #0x4] -+ str r3, [r5, r0] -+ add r8, r8, #8 -+ sub r1, r1, #1 -+ cmp r1, #0 -+ bgt update_calib -+ -+ /* perform a force measurement. */ -+ ldr r0, =0x800 -+ str r0, [r5, #MMDC0_MPMUR0] -+ ldr r2, =MMDC1_MPMUR0 -+ str r0, [r5, r2] -+ -+ /* clear SBS - unblock DDR accesses. */ -+ ldr r0, [r5, #MMDC0_MADPCR0] -+ bic r0, r0, #(1 << 8) -+ str r0, [r5, #MMDC0_MADPCR0] -+ -+ mov r0, #0x0 -+ str r0, [r5, #MMDC0_MDSCR] -+poll_conreq_clear_2: -+ ldr r0, [r5, #MMDC0_MDSCR] -+ and r0, r0, #(0x4 << 12) -+ cmp r0, #(0x4 << 12) -+ beq poll_conreq_clear_2 -+ -+done: -+ /* restore registers */ -+ -+ ldmfd sp!, {r4-r12} -+ mov pc, lr -+ -+ .type mx6_do_ddr3_freq_change, #object -+ENTRY(mx6_do_ddr_freq_change) -+ .word mx6_ddr3_freq_change -+ .size mx6_ddr3_freq_change, . 
- mx6_ddr3_freq_change -diff -Nur linux-4.1.3/arch/arm/mach-imx/Kconfig linux-xbian-imx6/arch/arm/mach-imx/Kconfig ---- linux-4.1.3/arch/arm/mach-imx/Kconfig 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/arch/arm/mach-imx/Kconfig 2015-07-27 23:13:01.053224513 +0200 -@@ -1,5 +1,6 @@ - menuconfig ARCH_MXC - bool "Freescale i.MX family" if ARCH_MULTI_V4_V5 || ARCH_MULTI_V6_V7 -+ select ARCH_HAS_RESET_CONTROLLER - select ARCH_REQUIRE_GPIOLIB - select ARM_CPU_SUSPEND if PM - select CLKSRC_MMIO -@@ -8,6 +9,7 @@ - select PM_OPP if PM - select SOC_BUS - select SRAM -+ select ZONE_DMA - help - Support for Freescale MXC/iMX-based family of processors - -@@ -58,7 +60,6 @@ - - config HAVE_IMX_SRC - def_bool y if SMP -- select ARCH_HAS_RESET_CONTROLLER - - config IMX_HAVE_IOMUX_V1 - bool -diff -Nur linux-4.1.3/arch/arm/mach-imx/lpddr2_freq_imx6.S linux-xbian-imx6/arch/arm/mach-imx/lpddr2_freq_imx6.S ---- linux-4.1.3/arch/arm/mach-imx/lpddr2_freq_imx6.S 1970-01-01 01:00:00.000000000 +0100 -+++ linux-xbian-imx6/arch/arm/mach-imx/lpddr2_freq_imx6.S 2015-07-27 23:13:01.093082305 +0200 -@@ -0,0 +1,484 @@ -+/* -+ * Copyright (C) 2012-2013 Freescale Semiconductor, Inc. All Rights Reserved. -+ * -+ * This program is free software; you can redistribute it and/or modify -+ * it under the terms of the GNU General Public License as published by -+ * the Free Software Foundation; either version 2 of the License, or -+ * (at your option) any later version. -+ -+ * This program is distributed in the hope that it will be useful, -+ * but WITHOUT ANY WARRANTY; without even the implied warranty of -+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the -+ * GNU General Public License for more details. -+ -+ * You should have received a copy of the GNU General Public License along -+ * with this program; if not, write to the Free Software Foundation, Inc., -+ * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. -+ */ -+ -+#include -+ -+ .macro mx6sl_switch_to_24MHz -+ -+ /* -+ * Set MMDC clock to be sourced from PLL3. -+ * Ensure first periph2_clk2 is sourced from PLL3. -+ * Set the PERIPH2_CLK2_PODF to divide by 2. -+ */ -+ ldr r6, [r2, #0x14] -+ bic r6, r6, #0x7 -+ orr r6, r6, #0x1 -+ str r6, [r2, #0x14] -+ -+ /* Select PLL3 to source MMDC. */ -+ ldr r6, [r2, #0x18] -+ bic r6, r6, #0x100000 -+ str r6, [r2, #0x18] -+ -+ /* Swtich periph2_clk_sel to run from PLL3. */ -+ ldr r6, [r2, #0x14] -+ orr r6, r6, #0x4000000 -+ str r6, [r2, #0x14] -+ -+periph2_clk_switch1: -+ ldr r6, [r2, #0x48] -+ cmp r6, #0 -+ bne periph2_clk_switch1 -+ -+ /* -+ * Need to clock gate the 528 PFDs before -+ * powering down PLL2. -+ * Only the PLL2_PFD2_400M should be ON -+ * at this time, so only clock gate that one. -+ */ -+ ldr r6, [r3, #0x100] -+ orr r6, r6, #0x800000 -+ str r6, [r3, #0x100] -+ -+ /* -+ * Set PLL2 to bypass state. We should be here -+ * only if MMDC is not sourced from PLL2. -+ */ -+ ldr r6, [r3, #0x30] -+ orr r6, r6, #0x10000 -+ str r6, [r3, #0x30] -+ -+ ldr r6, [r3, #0x30] -+ orr r6, r6, #0x1000 -+ str r6, [r3, #0x30] -+ -+ /* Ensure pre_periph2_clk_mux is set to pll2 */ -+ ldr r6, [r2, #0x18] -+ bic r6, r6, #0x600000 -+ str r6, [r2, #0x18] -+ -+ /* Set MMDC clock to be sourced from the bypassed PLL2. */ -+ ldr r6, [r2, #0x14] -+ bic r6, r6, #0x4000000 -+ str r6, [r2, #0x14] -+ -+periph2_clk_switch2: -+ ldr r6, [r2, #0x48] -+ cmp r6, #0 -+ bne periph2_clk_switch2 -+ -+ /* -+ * Now move MMDC back to periph2_clk2 source. -+ * after selecting PLL2 as the option. -+ * Select PLL2 as the source. 
-+ */ -+ ldr r6, [r2, #0x18] -+ orr r6, r6, #0x100000 -+ str r6, [r2, #0x18] -+ -+ /* set periph2_clk2_podf to divide by 1. */ -+ ldr r6, [r2, #0x14] -+ bic r6, r6, #0x7 -+ str r6, [r2, #0x14] -+ -+ /* Now move periph2_clk to periph2_clk2 source */ -+ ldr r6, [r2, #0x14] -+ orr r6, r6, #0x4000000 -+ str r6, [r2, #0x14] -+ -+periph2_clk_switch3: -+ ldr r6, [r2, #0x48] -+ cmp r6, #0 -+ bne periph2_clk_switch3 -+ -+ /* Now set the MMDC PODF back to 1.*/ -+ ldr r6, [r2, #0x14] -+ bic r6, r6, #0x38 -+ str r6, [r2, #0x14] -+ -+mmdc_podf0: -+ ldr r6, [r2, #0x48] -+ cmp r6, #0 -+ bne mmdc_podf0 -+ -+ .endm -+ -+ .macro ddr_switch_400MHz -+ -+ /* Set MMDC divider first, in case PLL3 is at 480MHz. */ -+ ldr r6, [r3, #0x10] -+ and r6, r6, #0x10000 -+ cmp r6, #0x10000 -+ beq pll3_in_bypass -+ -+ /* Set MMDC divder to divide by 2. */ -+ ldr r6, [r2, #0x14] -+ bic r6, r6, #0x38 -+ orr r6, r6, #0x8 -+ str r6, [r2, #0x14] -+ -+mmdc_podf: -+ ldr r6, [r2, #0x48] -+ cmp r6, #0 -+ bne mmdc_podf -+ -+pll3_in_bypass: -+ /* -+ * Check if we are switching between -+ * 400Mhz <-> 100MHz.If so, we should -+ * try to source MMDC from PLL2_200M. -+ */ -+ cmp r1, #0 -+ beq not_low_bus_freq -+ -+ /* Ensure that MMDC is sourced from PLL2 mux first. */ -+ ldr r6, [r2, #0x14] -+ bic r6, r6, #0x4000000 -+ str r6, [r2, #0x14] -+ -+periph2_clk_switch4: -+ ldr r6, [r2, #0x48] -+ cmp r6, #0 -+ bne periph2_clk_switch4 -+ -+not_low_bus_freq: -+ /* Now ensure periph2_clk2_sel mux is set to PLL3 */ -+ ldr r6, [r2, #0x18] -+ bic r6, r6, #0x100000 -+ str r6, [r2, #0x18] -+ -+ /* Now switch MMDC to PLL3. */ -+ ldr r6, [r2, #0x14] -+ orr r6, r6, #0x4000000 -+ str r6, [r2, #0x14] -+ -+periph2_clk_switch5: -+ ldr r6, [r2, #0x48] -+ cmp r6, #0 -+ bne periph2_clk_switch5 -+ -+ /* -+ * Check if PLL2 is already unlocked. -+ * If so do nothing with PLL2. -+ */ -+ cmp r1, #0 -+ beq pll2_already_on -+ -+ /* Now power up PLL2 and unbypass it. */ -+ ldr r6, [r3, #0x30] -+ bic r6, r6, #0x1000 -+ str r6, [r3, #0x30] -+ -+ /* Make sure PLL2 has locked.*/ -+wait_for_pll_lock: -+ ldr r6, [r3, #0x30] -+ and r6, r6, #0x80000000 -+ cmp r6, #0x80000000 -+ bne wait_for_pll_lock -+ -+ ldr r6, [r3, #0x30] -+ bic r6, r6, #0x10000 -+ str r6, [r3, #0x30] -+ -+ /* -+ * Need to enable the 528 PFDs after -+ * powering up PLL2. -+ * Only the PLL2_PFD2_400M should be ON -+ * as it feeds the MMDC. Rest should have -+ * been managed by clock code. -+ */ -+ ldr r6, [r3, #0x100] -+ bic r6, r6, #0x800000 -+ str r6, [r3, #0x100] -+ -+pll2_already_on: -+ /* -+ * Now switch MMDC clk back to pll2_mux option. -+ * Ensure pre_periph2_clk2 is set to pll2_pfd_400M. -+ * If switching to audio DDR freq, set the -+ * pre_periph2_clk2 to PLL2_PFD_200M -+ */ -+ ldr r6, =400000000 -+ cmp r6, r0 -+ bne use_pll2_pfd_200M -+ -+ ldr r6, [r2, #0x18] -+ bic r6, r6, #0x600000 -+ orr r6, r6, #0x200000 -+ str r6, [r2, #0x18] -+ ldr r6, =400000000 -+ b cont2 -+ -+use_pll2_pfd_200M: -+ ldr r6, [r2, #0x18] -+ orr r6, r6, #0x600000 -+ str r6, [r2, #0x18] -+ ldr r6, =200000000 -+ -+cont2: -+ ldr r4, [r2, #0x14] -+ bic r4, r4, #0x4000000 -+ str r4, [r2, #0x14] -+ -+periph2_clk_switch6: -+ ldr r4, [r2, #0x48] -+ cmp r4, #0 -+ bne periph2_clk_switch6 -+ -+change_divider_only: -+ /* -+ * Calculate the MMDC divider -+ * based on the requested freq. -+ */ -+ ldr r4, =0 -+Loop2: -+ sub r6, r6, r0 -+ cmp r6, r0 -+ blt Div_Found -+ add r4, r4, #1 -+ bgt Loop2 -+ -+ /* Shift divider into correct offset. */ -+ lsl r4, r4, #3 -+Div_Found: -+ /* Set the MMDC PODF. 
*/ -+ ldr r6, [r2, #0x14] -+ bic r6, r6, #0x38 -+ orr r6, r6, r4 -+ str r6, [r2, #0x14] -+ -+mmdc_podf1: -+ ldr r6, [r2, #0x48] -+ cmp r6, #0 -+ bne mmdc_podf1 -+ -+ .endm -+ -+ .macro mmdc_clk_lower_100MHz -+ -+ /* -+ * Prior to reducing the DDR frequency (at 528/400 MHz), -+ * read the Measure unit count bits (MU_UNIT_DEL_NUM) -+ */ -+ ldr r5, =0x8B8 -+ ldr r6, [r8, r5] -+ /* Original MU unit count */ -+ mov r6, r6, LSR #16 -+ ldr r4, =0x3FF -+ and r6, r6, r4 -+ /* Original MU unit count * 2 */ -+ mov r7, r6, LSL #1 -+ /* -+ * Bypass the automatic measure unit when below 100 MHz -+ * by setting the Measure unit bypass enable bit (MU_BYP_EN) -+ */ -+ ldr r6, [r8, r5] -+ orr r6, r6, #0x400 -+ str r6, [r8, r5] -+ /* -+ * Double the measure count value read in step 1 and program it in the -+ * measurement bypass bits (MU_BYP_VAL) of the MMDC PHY Measure Unit -+ * Register for the reduced frequency operation below 100 MHz -+ */ -+ ldr r6, [r8, r5] -+ ldr r4, =0x3FF -+ bic r6, r6, r4 -+ orr r6, r6, r7 -+ str r6, [r8, r5] -+ /* Now perform a Force Measurement. */ -+ ldr r6, [r8, r5] -+ orr r6, r6, #0x800 -+ str r6, [r8, r5] -+ /* Wait for FRC_MSR to clear. */ -+force_measure: -+ ldr r6, [r8, r5] -+ and r6, r6, #0x800 -+ cmp r6, #0x0 -+ bne force_measure -+ -+ .endm -+ -+ .macro mmdc_clk_above_100MHz -+ -+ /* Make sure that the PHY measurement unit is NOT in bypass mode */ -+ ldr r5, =0x8B8 -+ ldr r6, [r8, r5] -+ bic r6, r6, #0x400 -+ str r6, [r8, r5] -+ /* Now perform a Force Measurement. */ -+ ldr r6, [r8, r5] -+ orr r6, r6, #0x800 -+ str r6, [r8, r5] -+ /* Wait for FRC_MSR to clear. */ -+force_measure1: -+ ldr r6, [r8, r5] -+ and r6, r6, #0x800 -+ cmp r6, #0x0 -+ bne force_measure1 -+ .endm -+ -+/* -+ * mx6_lpddr2_freq_change -+ * -+ * Make sure DDR is in self-refresh. -+ * IRQs are already disabled. -+ * r0 : DDR freq. -+ * r1: low_bus_freq_mode flag -+ * r2: Pointer to array containing addresses of registers. -+ */ -+ .align 3 -+ENTRY(mx6_lpddr2_freq_change) -+ -+ push {r4-r10} -+ -+ mov r4, r2 -+ ldr r3, [r4] @ANATOP_BASE_ADDR -+ ldr r2, [r4, #0x4] @CCM_BASE_ADDR -+ ldr r8, [r4, #0x8] @MMDC_P0_BASE_ADDR -+ ldr r7, [r4, #0xC] @L2_BASE_ADDR -+ -+lpddr2_freq_change: -+ adr r9, lpddr2_freq_change -+ -+ /* Prime all TLB entries. */ -+ ldr r6, [r9] -+ ldr r6, [r8] -+ ldr r6, [r3] -+ ldr r6, [r2] -+ -+ /* Drain all the L1 buffers. */ -+ dsb -+ -+#ifdef CONFIG_CACHE_L2X0 -+ /* -+ * Need to make sure the buffers in L2 are drained. -+ * Performing a sync operation does this. -+ */ -+ mov r6, #0x0 -+ str r6, [r7, #0x730] -+#endif -+ -+ /* -+ * The second dsb might be needed to keep cache sync (device write) -+ * ordering with the memory accesses before it. -+ */ -+ dsb -+ isb -+ -+ /* Disable Automatic power savings. */ -+ ldr r6, [r8, #0x404] -+ orr r6, r6, #0x01 -+ str r6, [r8, #0x404] -+ -+ /* MMDC0_MDPDC disable power down timer */ -+ ldr r6, [r8, #0x4] -+ bic r6, r6, #0xff00 -+ str r6, [r8, #0x4] -+ -+ /* Delay for a while */ -+ ldr r10, =10 -+delay1: -+ ldr r7, =0 -+cont1: -+ ldr r6, [r8, r7] -+ add r7, r7, #4 -+ cmp r7, #16 -+ bne cont1 -+ sub r10, r10, #1 -+ cmp r10, #0 -+ bgt delay1 -+ -+ /* Make the DDR explicitly enter self-refresh. 
*/ -+ ldr r6, [r8, #0x404] -+ orr r6, r6, #0x200000 -+ str r6, [r8, #0x404] -+ -+poll_dvfs_set_1: -+ ldr r6, [r8, #0x404] -+ and r6, r6, #0x2000000 -+ cmp r6, #0x2000000 -+ bne poll_dvfs_set_1 -+ -+ /* set SBS step-by-step mode */ -+ ldr r6, [r8, #0x410] -+ orr r6, r6, #0x100 -+ str r6, [r8, #0x410] -+ -+ ldr r10, =100000000 -+ cmp r0, r10 -+ bgt set_ddr_mu_above_100 -+ mmdc_clk_lower_100MHz -+ -+set_ddr_mu_above_100: -+ ldr r10, =24000000 -+ cmp r0, r10 -+ beq set_to_24MHz -+ -+ ddr_switch_400MHz -+ -+ ldr r10,=100000000 -+ cmp r0, r10 -+ blt done -+ mmdc_clk_above_100MHz -+ -+ b done -+ -+set_to_24MHz: -+ mx6sl_switch_to_24MHz -+ -+done: -+ /* clear DVFS - exit from self refresh mode */ -+ ldr r6, [r8, #0x404] -+ bic r6, r6, #0x200000 -+ str r6, [r8, #0x404] -+ -+poll_dvfs_clear_1: -+ ldr r6, [r8, #0x404] -+ and r6, r6, #0x2000000 -+ cmp r6, #0x2000000 -+ beq poll_dvfs_clear_1 -+ -+ /* Enable Automatic power savings. */ -+ ldr r6, [r8, #0x404] -+ bic r6, r6, #0x01 -+ str r6, [r8, #0x404] -+ -+ ldr r10, =24000000 -+ cmp r0, r10 -+ beq skip_power_down -+ -+ /* Enable MMDC power down timer. */ -+ ldr r6, [r8, #0x4] -+ orr r6, r6, #0x5500 -+ str r6, [r8, #0x4] -+ -+skip_power_down: -+ /* clear SBS - unblock DDR accesses */ -+ ldr r6, [r8, #0x410] -+ bic r6, r6, #0x100 -+ str r6, [r8, #0x410] -+ -+ pop {r4-r10} -+ -+ /* Restore registers */ -+ mov pc, lr -+ -+ .type mx6_lpddr2_do_iram, #object -+ENTRY(mx6_lpddr2_do_iram) -+ .word mx6_lpddr2_freq_change -+ .size mx6_lpddr2_freq_change, . - mx6_lpddr2_freq_change -diff -Nur linux-4.1.3/arch/arm/mach-imx/mach-imx6q.c linux-xbian-imx6/arch/arm/mach-imx/mach-imx6q.c ---- linux-4.1.3/arch/arm/mach-imx/mach-imx6q.c 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/arch/arm/mach-imx/mach-imx6q.c 2015-07-27 23:13:01.097068084 +0200 -@@ -265,10 +265,12 @@ - static void __init imx6q_init_machine(void) - { - struct device *parent; -+ void __iomem *p; - - imx_print_silicon_rev(cpu_is_imx6dl() ? "i.MX6DL" : "i.MX6Q", - imx_get_soc_revision()); - -+ mxc_arch_reset_init_dt(); - parent = imx_soc_device_init(); - if (parent == NULL) - pr_warn("failed to initialize soc device\n"); -@@ -281,6 +283,12 @@ - cpu_is_imx6q() ? 
imx6q_pm_init() : imx6dl_pm_init(); - imx6q_1588_init(); - imx6q_axi_init(); -+ -+ p = ioremap(0x21b0000, SZ_4K); -+ if (p) { -+ writel(0x7f, p + 0x40); -+ iounmap(p); -+ } - } - - #define OCOTP_CFG3 0x440 -@@ -330,6 +338,12 @@ - if (dev_pm_opp_disable(cpu_dev, 852000000)) - pr_warn("failed to disable 852 MHz OPP\n"); - } -+ if (vpu352) { -+ if (dev_pm_opp_disable(cpu_dev, 396000000)) -+ pr_warn("VPU352: failed to disable 396MHz OPP\n"); -+ pr_info("VPU352: remove 396MHz OPP for VPU running at 352MHz!\n"); -+ } -+ - iounmap(base); - put_node: - of_node_put(np); -@@ -408,4 +422,5 @@ - .init_machine = imx6q_init_machine, - .init_late = imx6q_init_late, - .dt_compat = imx6q_dt_compat, -+ .restart = mxc_restart, - MACHINE_END -diff -Nur linux-4.1.3/arch/arm/mach-imx/Makefile linux-xbian-imx6/arch/arm/mach-imx/Makefile ---- linux-4.1.3/arch/arm/mach-imx/Makefile 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/arch/arm/mach-imx/Makefile 2015-07-27 23:13:01.053224513 +0200 -@@ -28,6 +28,12 @@ - obj-$(CONFIG_MXC_USE_EPIT) += epit.o - obj-$(CONFIG_MXC_DEBUG_BOARD) += 3ds_debugboard.o - -+obj-y += busfreq-imx6.o -+ifdef CONFIG_ARM_IMX6Q_CPUFREQ -+obj-$(CONFIG_SOC_IMX6Q) += ddr3_freq_imx6.o busfreq_ddr3.o -+obj-$(CONFIG_SOC_IMX6SL) += lpddr2_freq_imx6.o busfreq_lpddr2.o -+endif -+ - ifeq ($(CONFIG_CPU_IDLE),y) - obj-$(CONFIG_SOC_IMX5) += cpuidle-imx5.o - obj-$(CONFIG_SOC_IMX6Q) += cpuidle-imx6q.o -diff -Nur linux-4.1.3/arch/arm/mach-imx/src.c linux-xbian-imx6/arch/arm/mach-imx/src.c ---- linux-4.1.3/arch/arm/mach-imx/src.c 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/arch/arm/mach-imx/src.c 2015-07-27 23:13:01.097068084 +0200 -@@ -1,5 +1,5 @@ - /* -- * Copyright 2011 Freescale Semiconductor, Inc. -+ * Copyright 2011-2014 Freescale Semiconductor, Inc. - * Copyright 2011 Linaro Ltd. - * - * The code contained herein is licensed under the GNU General Public -@@ -18,6 +18,7 @@ - #include - #include - #include "common.h" -+#include "hardware.h" - - #define SRC_SCR 0x000 - #define SRC_GPR1 0x020 -@@ -32,6 +33,7 @@ - - static void __iomem *src_base; - static DEFINE_SPINLOCK(scr_lock); -+static bool m4_is_enabled; - - static const int sw_reset_bits[5] = { - BP_SRC_SCR_SW_GPU_RST, -@@ -41,6 +43,11 @@ - BP_SRC_SCR_SW_IPU2_RST - }; - -+bool imx_src_is_m4_enabled(void) -+{ -+ return m4_is_enabled; -+} -+ - static int imx_src_reset_module(struct reset_controller_dev *rcdev, - unsigned long sw_reset_idx) - { -@@ -136,6 +143,14 @@ - */ - spin_lock(&scr_lock); - val = readl_relaxed(src_base + SRC_SCR); -+ -+ /* bit 4 is m4c_non_sclr_rst on i.MX6SX */ -+ if (cpu_is_imx6sx() && ((val & -+ (1 << BP_SRC_SCR_SW_OPEN_VG_RST)) == 0)) -+ m4_is_enabled = true; -+ else -+ m4_is_enabled = false; -+ - val &= ~(1 << BP_SRC_SCR_WARM_RESET_ENABLE); - writel_relaxed(val, src_base + SRC_SCR); - spin_unlock(&scr_lock); -diff -Nur linux-4.1.3/arch/arm/mach-imx/system.c linux-xbian-imx6/arch/arm/mach-imx/system.c ---- linux-4.1.3/arch/arm/mach-imx/system.c 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/arch/arm/mach-imx/system.c 2015-07-27 23:13:01.101053863 +0200 -@@ -34,6 +34,7 @@ - - static void __iomem *wdog_base; - static struct clk *wdog_clk; -+static u32 wdog_source = 1; /* use WDOG1 default */ - - /* - * Reset the system. It is called by machine_restart(). -@@ -50,6 +51,17 @@ - - if (cpu_is_mx1()) - wcr_enable = (1 << 0); -+ /* -+ * Some i.MX6 boards use WDOG2 to reset external pmic in bypass mode, -+ * so do WDOG2 reset here. Do not set SRS, since we will -+ * trigger external POR later. 
Use WDOG1 to reset in ldo-enable -+ * mode. You can set it by "fsl,wdog-reset" in dts. -+ * For i.MX6SX we have to trigger wdog-reset to reset QSPI-NOR flash to -+ * workaround qspi-nor reboot issue whatever ldo-bypass or not. -+ */ -+ else if ((wdog_source == 2 && (cpu_is_imx6q() || cpu_is_imx6dl() || -+ cpu_is_imx6sl())) || cpu_is_imx6sx()) -+ wcr_enable = 0x14; - else - wcr_enable = (1 << 2); - -@@ -89,6 +101,41 @@ - clk_prepare(wdog_clk); - } - -+void __init mxc_arch_reset_init_dt(void) -+{ -+ struct device_node *np = NULL; -+ -+ if (cpu_is_imx6q() || cpu_is_imx6dl()) -+ np = of_find_compatible_node(NULL, NULL, "fsl,imx6q-gpc"); -+ else if (cpu_is_imx6sl()) -+ np = of_find_compatible_node(NULL, NULL, "fsl,imx6sl-gpc"); -+ -+ if (np) -+ of_property_read_u32(np, "fsl,wdog-reset", &wdog_source); -+ pr_info("Use WDOG%d as reset source\n", wdog_source); -+ -+ np = of_find_compatible_node(NULL, NULL, "fsl,imx21-wdt"); -+ wdog_base = of_iomap(np, 0); -+ WARN_ON(!wdog_base); -+ -+ /* Some i.MX6 boards use WDOG2 to reset board in ldo-bypass mode */ -+ if (wdog_source == 2 && (cpu_is_imx6q() || cpu_is_imx6dl() || -+ cpu_is_imx6sl())) { -+ np = of_find_compatible_node(np, NULL, "fsl,imx21-wdt"); -+ wdog_base = of_iomap(np, 0); -+ WARN_ON(!wdog_base); -+ } -+ -+ wdog_clk = of_clk_get(np, 0); -+ if (IS_ERR(wdog_clk)) { -+ pr_warn("%s: failed to get wdog clock\n", __func__); -+ wdog_clk = NULL; -+ return; -+ } -+ -+ clk_prepare(wdog_clk); -+} -+ - #ifdef CONFIG_CACHE_L2X0 - void __init imx_init_l2cache(void) - { -diff -Nur linux-4.1.3/arch/arm/mm/cache-v7.S linux-xbian-imx6/arch/arm/mm/cache-v7.S ---- linux-4.1.3/arch/arm/mm/cache-v7.S 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/arch/arm/mm/cache-v7.S 2015-07-27 23:13:01.503617563 +0200 -@@ -446,3 +446,5 @@ - - @ define struct cpu_cache_fns (see and proc-macros.S) - define_cache_functions v7 -+ -+ .long v7_dma_flush_range -diff -Nur linux-4.1.3/block/bfq-cgroup.c linux-xbian-imx6/block/bfq-cgroup.c ---- linux-4.1.3/block/bfq-cgroup.c 1970-01-01 01:00:00.000000000 +0100 -+++ linux-xbian-imx6/block/bfq-cgroup.c 2015-07-27 23:13:03.600137415 +0200 -@@ -0,0 +1,936 @@ -+/* -+ * BFQ: CGROUPS support. -+ * -+ * Based on ideas and code from CFQ: -+ * Copyright (C) 2003 Jens Axboe -+ * -+ * Copyright (C) 2008 Fabio Checconi -+ * Paolo Valente -+ * -+ * Copyright (C) 2010 Paolo Valente -+ * -+ * Licensed under the GPL-2 as detailed in the accompanying COPYING.BFQ -+ * file. -+ */ -+ -+#ifdef CONFIG_CGROUP_BFQIO -+ -+static DEFINE_MUTEX(bfqio_mutex); -+ -+static bool bfqio_is_removed(struct bfqio_cgroup *bgrp) -+{ -+ return bgrp ? !bgrp->online : false; -+} -+ -+static struct bfqio_cgroup bfqio_root_cgroup = { -+ .weight = BFQ_DEFAULT_GRP_WEIGHT, -+ .ioprio = BFQ_DEFAULT_GRP_IOPRIO, -+ .ioprio_class = BFQ_DEFAULT_GRP_CLASS, -+}; -+ -+static inline void bfq_init_entity(struct bfq_entity *entity, -+ struct bfq_group *bfqg) -+{ -+ entity->weight = entity->new_weight; -+ entity->orig_weight = entity->new_weight; -+ entity->ioprio = entity->new_ioprio; -+ entity->ioprio_class = entity->new_ioprio_class; -+ entity->parent = bfqg->my_entity; -+ entity->sched_data = &bfqg->sched_data; -+} -+ -+static struct bfqio_cgroup *css_to_bfqio(struct cgroup_subsys_state *css) -+{ -+ return css ? container_of(css, struct bfqio_cgroup, css) : NULL; -+} -+ -+/* -+ * Search the bfq_group for bfqd into the hash table (by now only a list) -+ * of bgrp. Must be called under rcu_read_lock(). 
-+ */ -+static struct bfq_group *bfqio_lookup_group(struct bfqio_cgroup *bgrp, -+ struct bfq_data *bfqd) -+{ -+ struct bfq_group *bfqg; -+ void *key; -+ -+ hlist_for_each_entry_rcu(bfqg, &bgrp->group_data, group_node) { -+ key = rcu_dereference(bfqg->bfqd); -+ if (key == bfqd) -+ return bfqg; -+ } -+ -+ return NULL; -+} -+ -+static inline void bfq_group_init_entity(struct bfqio_cgroup *bgrp, -+ struct bfq_group *bfqg) -+{ -+ struct bfq_entity *entity = &bfqg->entity; -+ -+ /* -+ * If the weight of the entity has never been set via the sysfs -+ * interface, then bgrp->weight == 0. In this case we initialize -+ * the weight from the current ioprio value. Otherwise, the group -+ * weight, if set, has priority over the ioprio value. -+ */ -+ if (bgrp->weight == 0) { -+ entity->new_weight = bfq_ioprio_to_weight(bgrp->ioprio); -+ entity->new_ioprio = bgrp->ioprio; -+ } else { -+ if (bgrp->weight < BFQ_MIN_WEIGHT || -+ bgrp->weight > BFQ_MAX_WEIGHT) { -+ printk(KERN_CRIT "bfq_group_init_entity: " -+ "bgrp->weight %d\n", bgrp->weight); -+ BUG(); -+ } -+ entity->new_weight = bgrp->weight; -+ entity->new_ioprio = bfq_weight_to_ioprio(bgrp->weight); -+ } -+ entity->orig_weight = entity->weight = entity->new_weight; -+ entity->ioprio = entity->new_ioprio; -+ entity->ioprio_class = entity->new_ioprio_class = bgrp->ioprio_class; -+ entity->my_sched_data = &bfqg->sched_data; -+ bfqg->active_entities = 0; -+} -+ -+static inline void bfq_group_set_parent(struct bfq_group *bfqg, -+ struct bfq_group *parent) -+{ -+ struct bfq_entity *entity; -+ -+ BUG_ON(parent == NULL); -+ BUG_ON(bfqg == NULL); -+ -+ entity = &bfqg->entity; -+ entity->parent = parent->my_entity; -+ entity->sched_data = &parent->sched_data; -+} -+ -+/** -+ * bfq_group_chain_alloc - allocate a chain of groups. -+ * @bfqd: queue descriptor. -+ * @css: the leaf cgroup_subsys_state this chain starts from. -+ * -+ * Allocate a chain of groups starting from the one belonging to -+ * @cgroup up to the root cgroup. Stop if a cgroup on the chain -+ * to the root has already an allocated group on @bfqd. -+ */ -+static struct bfq_group *bfq_group_chain_alloc(struct bfq_data *bfqd, -+ struct cgroup_subsys_state *css) -+{ -+ struct bfqio_cgroup *bgrp; -+ struct bfq_group *bfqg, *prev = NULL, *leaf = NULL; -+ -+ for (; css != NULL; css = css->parent) { -+ bgrp = css_to_bfqio(css); -+ -+ bfqg = bfqio_lookup_group(bgrp, bfqd); -+ if (bfqg != NULL) { -+ /* -+ * All the cgroups in the path from there to the -+ * root must have a bfq_group for bfqd, so we don't -+ * need any more allocations. -+ */ -+ break; -+ } -+ -+ bfqg = kzalloc(sizeof(*bfqg), GFP_ATOMIC); -+ if (bfqg == NULL) -+ goto cleanup; -+ -+ bfq_group_init_entity(bgrp, bfqg); -+ bfqg->my_entity = &bfqg->entity; -+ -+ if (leaf == NULL) { -+ leaf = bfqg; -+ prev = leaf; -+ } else { -+ bfq_group_set_parent(prev, bfqg); -+ /* -+ * Build a list of allocated nodes using the bfqd -+ * filed, that is still unused and will be -+ * initialized only after the node will be -+ * connected. -+ */ -+ prev->bfqd = bfqg; -+ prev = bfqg; -+ } -+ } -+ -+ return leaf; -+ -+cleanup: -+ while (leaf != NULL) { -+ prev = leaf; -+ leaf = leaf->bfqd; -+ kfree(prev); -+ } -+ -+ return NULL; -+} -+ -+/** -+ * bfq_group_chain_link - link an allocated group chain to a cgroup -+ * hierarchy. -+ * @bfqd: the queue descriptor. -+ * @css: the leaf cgroup_subsys_state to start from. -+ * @leaf: the leaf group (to be associated to @cgroup). 
-+ * -+ * Try to link a chain of groups to a cgroup hierarchy, connecting the -+ * nodes bottom-up, so we can be sure that when we find a cgroup in the -+ * hierarchy that already as a group associated to @bfqd all the nodes -+ * in the path to the root cgroup have one too. -+ * -+ * On locking: the queue lock protects the hierarchy (there is a hierarchy -+ * per device) while the bfqio_cgroup lock protects the list of groups -+ * belonging to the same cgroup. -+ */ -+static void bfq_group_chain_link(struct bfq_data *bfqd, -+ struct cgroup_subsys_state *css, -+ struct bfq_group *leaf) -+{ -+ struct bfqio_cgroup *bgrp; -+ struct bfq_group *bfqg, *next, *prev = NULL; -+ unsigned long flags; -+ -+ assert_spin_locked(bfqd->queue->queue_lock); -+ -+ for (; css != NULL && leaf != NULL; css = css->parent) { -+ bgrp = css_to_bfqio(css); -+ next = leaf->bfqd; -+ -+ bfqg = bfqio_lookup_group(bgrp, bfqd); -+ BUG_ON(bfqg != NULL); -+ -+ spin_lock_irqsave(&bgrp->lock, flags); -+ -+ rcu_assign_pointer(leaf->bfqd, bfqd); -+ hlist_add_head_rcu(&leaf->group_node, &bgrp->group_data); -+ hlist_add_head(&leaf->bfqd_node, &bfqd->group_list); -+ -+ spin_unlock_irqrestore(&bgrp->lock, flags); -+ -+ prev = leaf; -+ leaf = next; -+ } -+ -+ BUG_ON(css == NULL && leaf != NULL); -+ if (css != NULL && prev != NULL) { -+ bgrp = css_to_bfqio(css); -+ bfqg = bfqio_lookup_group(bgrp, bfqd); -+ bfq_group_set_parent(prev, bfqg); -+ } -+} -+ -+/** -+ * bfq_find_alloc_group - return the group associated to @bfqd in @cgroup. -+ * @bfqd: queue descriptor. -+ * @cgroup: cgroup being searched for. -+ * -+ * Return a group associated to @bfqd in @cgroup, allocating one if -+ * necessary. When a group is returned all the cgroups in the path -+ * to the root have a group associated to @bfqd. -+ * -+ * If the allocation fails, return the root group: this breaks guarantees -+ * but is a safe fallback. If this loss becomes a problem it can be -+ * mitigated using the equivalent weight (given by the product of the -+ * weights of the groups in the path from @group to the root) in the -+ * root scheduler. -+ * -+ * We allocate all the missing nodes in the path from the leaf cgroup -+ * to the root and we connect the nodes only after all the allocations -+ * have been successful. -+ */ -+static struct bfq_group *bfq_find_alloc_group(struct bfq_data *bfqd, -+ struct cgroup_subsys_state *css) -+{ -+ struct bfqio_cgroup *bgrp = css_to_bfqio(css); -+ struct bfq_group *bfqg; -+ -+ bfqg = bfqio_lookup_group(bgrp, bfqd); -+ if (bfqg != NULL) -+ return bfqg; -+ -+ bfqg = bfq_group_chain_alloc(bfqd, css); -+ if (bfqg != NULL) -+ bfq_group_chain_link(bfqd, css, bfqg); -+ else -+ bfqg = bfqd->root_group; -+ -+ return bfqg; -+} -+ -+/** -+ * bfq_bfqq_move - migrate @bfqq to @bfqg. -+ * @bfqd: queue descriptor. -+ * @bfqq: the queue to move. -+ * @entity: @bfqq's entity. -+ * @bfqg: the group to move to. -+ * -+ * Move @bfqq to @bfqg, deactivating it from its old group and reactivating -+ * it on the new one. Avoid putting the entity on the old group idle tree. -+ * -+ * Must be called under the queue lock; the cgroup owning @bfqg must -+ * not disappear (by now this just means that we are called under -+ * rcu_read_lock()). 
-+ */ -+static void bfq_bfqq_move(struct bfq_data *bfqd, struct bfq_queue *bfqq, -+ struct bfq_entity *entity, struct bfq_group *bfqg) -+{ -+ int busy, resume; -+ -+ busy = bfq_bfqq_busy(bfqq); -+ resume = !RB_EMPTY_ROOT(&bfqq->sort_list); -+ -+ BUG_ON(resume && !entity->on_st); -+ BUG_ON(busy && !resume && entity->on_st && -+ bfqq != bfqd->in_service_queue); -+ -+ if (busy) { -+ BUG_ON(atomic_read(&bfqq->ref) < 2); -+ -+ if (!resume) -+ bfq_del_bfqq_busy(bfqd, bfqq, 0); -+ else -+ bfq_deactivate_bfqq(bfqd, bfqq, 0); -+ } else if (entity->on_st) -+ bfq_put_idle_entity(bfq_entity_service_tree(entity), entity); -+ -+ /* -+ * Here we use a reference to bfqg. We don't need a refcounter -+ * as the cgroup reference will not be dropped, so that its -+ * destroy() callback will not be invoked. -+ */ -+ entity->parent = bfqg->my_entity; -+ entity->sched_data = &bfqg->sched_data; -+ -+ if (busy && resume) -+ bfq_activate_bfqq(bfqd, bfqq); -+ -+ if (bfqd->in_service_queue == NULL && !bfqd->rq_in_driver) -+ bfq_schedule_dispatch(bfqd); -+} -+ -+/** -+ * __bfq_bic_change_cgroup - move @bic to @cgroup. -+ * @bfqd: the queue descriptor. -+ * @bic: the bic to move. -+ * @cgroup: the cgroup to move to. -+ * -+ * Move bic to cgroup, assuming that bfqd->queue is locked; the caller -+ * has to make sure that the reference to cgroup is valid across the call. -+ * -+ * NOTE: an alternative approach might have been to store the current -+ * cgroup in bfqq and getting a reference to it, reducing the lookup -+ * time here, at the price of slightly more complex code. -+ */ -+static struct bfq_group *__bfq_bic_change_cgroup(struct bfq_data *bfqd, -+ struct bfq_io_cq *bic, -+ struct cgroup_subsys_state *css) -+{ -+ struct bfq_queue *async_bfqq = bic_to_bfqq(bic, 0); -+ struct bfq_queue *sync_bfqq = bic_to_bfqq(bic, 1); -+ struct bfq_entity *entity; -+ struct bfq_group *bfqg; -+ struct bfqio_cgroup *bgrp; -+ -+ bgrp = css_to_bfqio(css); -+ -+ bfqg = bfq_find_alloc_group(bfqd, css); -+ if (async_bfqq != NULL) { -+ entity = &async_bfqq->entity; -+ -+ if (entity->sched_data != &bfqg->sched_data) { -+ bic_set_bfqq(bic, NULL, 0); -+ bfq_log_bfqq(bfqd, async_bfqq, -+ "bic_change_group: %p %d", -+ async_bfqq, atomic_read(&async_bfqq->ref)); -+ bfq_put_queue(async_bfqq); -+ } -+ } -+ -+ if (sync_bfqq != NULL) { -+ entity = &sync_bfqq->entity; -+ if (entity->sched_data != &bfqg->sched_data) -+ bfq_bfqq_move(bfqd, sync_bfqq, entity, bfqg); -+ } -+ -+ return bfqg; -+} -+ -+/** -+ * bfq_bic_change_cgroup - move @bic to @cgroup. -+ * @bic: the bic being migrated. -+ * @cgroup: the destination cgroup. -+ * -+ * When the task owning @bic is moved to @cgroup, @bic is immediately -+ * moved into its new parent group. -+ */ -+static void bfq_bic_change_cgroup(struct bfq_io_cq *bic, -+ struct cgroup_subsys_state *css) -+{ -+ struct bfq_data *bfqd; -+ unsigned long uninitialized_var(flags); -+ -+ bfqd = bfq_get_bfqd_locked(&(bic->icq.q->elevator->elevator_data), -+ &flags); -+ if (bfqd != NULL) { -+ __bfq_bic_change_cgroup(bfqd, bic, css); -+ bfq_put_bfqd_unlock(bfqd, &flags); -+ } -+} -+ -+/** -+ * bfq_bic_update_cgroup - update the cgroup of @bic. -+ * @bic: the @bic to update. -+ * -+ * Make sure that @bic is enqueued in the cgroup of the current task. -+ * We need this in addition to moving bics during the cgroup attach -+ * phase because the task owning @bic could be at its first disk -+ * access or we may end up in the root cgroup as the result of a -+ * memory allocation failure and here we try to move to the right -+ * group. 
-+ * -+ * Must be called under the queue lock. It is safe to use the returned -+ * value even after the rcu_read_unlock() as the migration/destruction -+ * paths act under the queue lock too. IOW it is impossible to race with -+ * group migration/destruction and end up with an invalid group as: -+ * a) here cgroup has not yet been destroyed, nor its destroy callback -+ * has started execution, as current holds a reference to it, -+ * b) if it is destroyed after rcu_read_unlock() [after current is -+ * migrated to a different cgroup] its attach() callback will have -+ * taken care of remove all the references to the old cgroup data. -+ */ -+static struct bfq_group *bfq_bic_update_cgroup(struct bfq_io_cq *bic) -+{ -+ struct bfq_data *bfqd = bic_to_bfqd(bic); -+ struct bfq_group *bfqg; -+ struct cgroup_subsys_state *css; -+ -+ BUG_ON(bfqd == NULL); -+ -+ rcu_read_lock(); -+ css = task_css(current, bfqio_cgrp_id); -+ bfqg = __bfq_bic_change_cgroup(bfqd, bic, css); -+ rcu_read_unlock(); -+ -+ return bfqg; -+} -+ -+/** -+ * bfq_flush_idle_tree - deactivate any entity on the idle tree of @st. -+ * @st: the service tree being flushed. -+ */ -+static inline void bfq_flush_idle_tree(struct bfq_service_tree *st) -+{ -+ struct bfq_entity *entity = st->first_idle; -+ -+ for (; entity != NULL; entity = st->first_idle) -+ __bfq_deactivate_entity(entity, 0); -+} -+ -+/** -+ * bfq_reparent_leaf_entity - move leaf entity to the root_group. -+ * @bfqd: the device data structure with the root group. -+ * @entity: the entity to move. -+ */ -+static inline void bfq_reparent_leaf_entity(struct bfq_data *bfqd, -+ struct bfq_entity *entity) -+{ -+ struct bfq_queue *bfqq = bfq_entity_to_bfqq(entity); -+ -+ BUG_ON(bfqq == NULL); -+ bfq_bfqq_move(bfqd, bfqq, entity, bfqd->root_group); -+ return; -+} -+ -+/** -+ * bfq_reparent_active_entities - move to the root group all active -+ * entities. -+ * @bfqd: the device data structure with the root group. -+ * @bfqg: the group to move from. -+ * @st: the service tree with the entities. -+ * -+ * Needs queue_lock to be taken and reference to be valid over the call. -+ */ -+static inline void bfq_reparent_active_entities(struct bfq_data *bfqd, -+ struct bfq_group *bfqg, -+ struct bfq_service_tree *st) -+{ -+ struct rb_root *active = &st->active; -+ struct bfq_entity *entity = NULL; -+ -+ if (!RB_EMPTY_ROOT(&st->active)) -+ entity = bfq_entity_of(rb_first(active)); -+ -+ for (; entity != NULL; entity = bfq_entity_of(rb_first(active))) -+ bfq_reparent_leaf_entity(bfqd, entity); -+ -+ if (bfqg->sched_data.in_service_entity != NULL) -+ bfq_reparent_leaf_entity(bfqd, -+ bfqg->sched_data.in_service_entity); -+ -+ return; -+} -+ -+/** -+ * bfq_destroy_group - destroy @bfqg. -+ * @bgrp: the bfqio_cgroup containing @bfqg. -+ * @bfqg: the group being destroyed. -+ * -+ * Destroy @bfqg, making sure that it is not referenced from its parent. -+ */ -+static void bfq_destroy_group(struct bfqio_cgroup *bgrp, struct bfq_group *bfqg) -+{ -+ struct bfq_data *bfqd; -+ struct bfq_service_tree *st; -+ struct bfq_entity *entity = bfqg->my_entity; -+ unsigned long uninitialized_var(flags); -+ int i; -+ -+ hlist_del(&bfqg->group_node); -+ -+ /* -+ * Empty all service_trees belonging to this group before -+ * deactivating the group itself. 
-+ */ -+ for (i = 0; i < BFQ_IOPRIO_CLASSES; i++) { -+ st = bfqg->sched_data.service_tree + i; -+ -+ /* -+ * The idle tree may still contain bfq_queues belonging -+ * to exited task because they never migrated to a different -+ * cgroup from the one being destroyed now. No one else -+ * can access them so it's safe to act without any lock. -+ */ -+ bfq_flush_idle_tree(st); -+ -+ /* -+ * It may happen that some queues are still active -+ * (busy) upon group destruction (if the corresponding -+ * processes have been forced to terminate). We move -+ * all the leaf entities corresponding to these queues -+ * to the root_group. -+ * Also, it may happen that the group has an entity -+ * in service, which is disconnected from the active -+ * tree: it must be moved, too. -+ * There is no need to put the sync queues, as the -+ * scheduler has taken no reference. -+ */ -+ bfqd = bfq_get_bfqd_locked(&bfqg->bfqd, &flags); -+ if (bfqd != NULL) { -+ bfq_reparent_active_entities(bfqd, bfqg, st); -+ bfq_put_bfqd_unlock(bfqd, &flags); -+ } -+ BUG_ON(!RB_EMPTY_ROOT(&st->active)); -+ BUG_ON(!RB_EMPTY_ROOT(&st->idle)); -+ } -+ BUG_ON(bfqg->sched_data.next_in_service != NULL); -+ BUG_ON(bfqg->sched_data.in_service_entity != NULL); -+ -+ /* -+ * We may race with device destruction, take extra care when -+ * dereferencing bfqg->bfqd. -+ */ -+ bfqd = bfq_get_bfqd_locked(&bfqg->bfqd, &flags); -+ if (bfqd != NULL) { -+ hlist_del(&bfqg->bfqd_node); -+ __bfq_deactivate_entity(entity, 0); -+ bfq_put_async_queues(bfqd, bfqg); -+ bfq_put_bfqd_unlock(bfqd, &flags); -+ } -+ BUG_ON(entity->tree != NULL); -+ -+ /* -+ * No need to defer the kfree() to the end of the RCU grace -+ * period: we are called from the destroy() callback of our -+ * cgroup, so we can be sure that no one is a) still using -+ * this cgroup or b) doing lookups in it. -+ */ -+ kfree(bfqg); -+} -+ -+static void bfq_end_wr_async(struct bfq_data *bfqd) -+{ -+ struct hlist_node *tmp; -+ struct bfq_group *bfqg; -+ -+ hlist_for_each_entry_safe(bfqg, tmp, &bfqd->group_list, bfqd_node) -+ bfq_end_wr_async_queues(bfqd, bfqg); -+ bfq_end_wr_async_queues(bfqd, bfqd->root_group); -+} -+ -+/** -+ * bfq_disconnect_groups - disconnect @bfqd from all its groups. -+ * @bfqd: the device descriptor being exited. -+ * -+ * When the device exits we just make sure that no lookup can return -+ * the now unused group structures. They will be deallocated on cgroup -+ * destruction. -+ */ -+static void bfq_disconnect_groups(struct bfq_data *bfqd) -+{ -+ struct hlist_node *tmp; -+ struct bfq_group *bfqg; -+ -+ bfq_log(bfqd, "disconnect_groups beginning"); -+ hlist_for_each_entry_safe(bfqg, tmp, &bfqd->group_list, bfqd_node) { -+ hlist_del(&bfqg->bfqd_node); -+ -+ __bfq_deactivate_entity(bfqg->my_entity, 0); -+ -+ /* -+ * Don't remove from the group hash, just set an -+ * invalid key. No lookups can race with the -+ * assignment as bfqd is being destroyed; this -+ * implies also that new elements cannot be added -+ * to the list. 
-+ */ -+ rcu_assign_pointer(bfqg->bfqd, NULL); -+ -+ bfq_log(bfqd, "disconnect_groups: put async for group %p", -+ bfqg); -+ bfq_put_async_queues(bfqd, bfqg); -+ } -+} -+ -+static inline void bfq_free_root_group(struct bfq_data *bfqd) -+{ -+ struct bfqio_cgroup *bgrp = &bfqio_root_cgroup; -+ struct bfq_group *bfqg = bfqd->root_group; -+ -+ bfq_put_async_queues(bfqd, bfqg); -+ -+ spin_lock_irq(&bgrp->lock); -+ hlist_del_rcu(&bfqg->group_node); -+ spin_unlock_irq(&bgrp->lock); -+ -+ /* -+ * No need to synchronize_rcu() here: since the device is gone -+ * there cannot be any read-side access to its root_group. -+ */ -+ kfree(bfqg); -+} -+ -+static struct bfq_group *bfq_alloc_root_group(struct bfq_data *bfqd, int node) -+{ -+ struct bfq_group *bfqg; -+ struct bfqio_cgroup *bgrp; -+ int i; -+ -+ bfqg = kzalloc_node(sizeof(*bfqg), GFP_KERNEL, node); -+ if (bfqg == NULL) -+ return NULL; -+ -+ bfqg->entity.parent = NULL; -+ for (i = 0; i < BFQ_IOPRIO_CLASSES; i++) -+ bfqg->sched_data.service_tree[i] = BFQ_SERVICE_TREE_INIT; -+ -+ bgrp = &bfqio_root_cgroup; -+ spin_lock_irq(&bgrp->lock); -+ rcu_assign_pointer(bfqg->bfqd, bfqd); -+ hlist_add_head_rcu(&bfqg->group_node, &bgrp->group_data); -+ spin_unlock_irq(&bgrp->lock); -+ -+ return bfqg; -+} -+ -+#define SHOW_FUNCTION(__VAR) \ -+static u64 bfqio_cgroup_##__VAR##_read(struct cgroup_subsys_state *css, \ -+ struct cftype *cftype) \ -+{ \ -+ struct bfqio_cgroup *bgrp = css_to_bfqio(css); \ -+ u64 ret = -ENODEV; \ -+ \ -+ mutex_lock(&bfqio_mutex); \ -+ if (bfqio_is_removed(bgrp)) \ -+ goto out_unlock; \ -+ \ -+ spin_lock_irq(&bgrp->lock); \ -+ ret = bgrp->__VAR; \ -+ spin_unlock_irq(&bgrp->lock); \ -+ \ -+out_unlock: \ -+ mutex_unlock(&bfqio_mutex); \ -+ return ret; \ -+} -+ -+SHOW_FUNCTION(weight); -+SHOW_FUNCTION(ioprio); -+SHOW_FUNCTION(ioprio_class); -+#undef SHOW_FUNCTION -+ -+#define STORE_FUNCTION(__VAR, __MIN, __MAX) \ -+static int bfqio_cgroup_##__VAR##_write(struct cgroup_subsys_state *css,\ -+ struct cftype *cftype, \ -+ u64 val) \ -+{ \ -+ struct bfqio_cgroup *bgrp = css_to_bfqio(css); \ -+ struct bfq_group *bfqg; \ -+ int ret = -EINVAL; \ -+ \ -+ if (val < (__MIN) || val > (__MAX)) \ -+ return ret; \ -+ \ -+ ret = -ENODEV; \ -+ mutex_lock(&bfqio_mutex); \ -+ if (bfqio_is_removed(bgrp)) \ -+ goto out_unlock; \ -+ ret = 0; \ -+ \ -+ spin_lock_irq(&bgrp->lock); \ -+ bgrp->__VAR = (unsigned short)val; \ -+ hlist_for_each_entry(bfqg, &bgrp->group_data, group_node) { \ -+ /* \ -+ * Setting the ioprio_changed flag of the entity \ -+ * to 1 with new_##__VAR == ##__VAR would re-set \ -+ * the value of the weight to its ioprio mapping. \ -+ * Set the flag only if necessary. \ -+ */ \ -+ if ((unsigned short)val != bfqg->entity.new_##__VAR) { \ -+ bfqg->entity.new_##__VAR = (unsigned short)val; \ -+ /* \ -+ * Make sure that the above new value has been \ -+ * stored in bfqg->entity.new_##__VAR before \ -+ * setting the ioprio_changed flag. In fact, \ -+ * this flag may be read asynchronously (in \ -+ * critical sections protected by a different \ -+ * lock than that held here), and finding this \ -+ * flag set may cause the execution of the code \ -+ * for updating parameters whose value may \ -+ * depend also on bfqg->entity.new_##__VAR (in \ -+ * __bfq_entity_update_weight_prio). \ -+ * This barrier makes sure that the new value \ -+ * of bfqg->entity.new_##__VAR is correctly \ -+ * seen in that code. 
\ -+ */ \ -+ smp_wmb(); \ -+ bfqg->entity.ioprio_changed = 1; \ -+ } \ -+ } \ -+ spin_unlock_irq(&bgrp->lock); \ -+ \ -+out_unlock: \ -+ mutex_unlock(&bfqio_mutex); \ -+ return ret; \ -+} -+ -+STORE_FUNCTION(weight, BFQ_MIN_WEIGHT, BFQ_MAX_WEIGHT); -+STORE_FUNCTION(ioprio, 0, IOPRIO_BE_NR - 1); -+STORE_FUNCTION(ioprio_class, IOPRIO_CLASS_RT, IOPRIO_CLASS_IDLE); -+#undef STORE_FUNCTION -+ -+static struct cftype bfqio_files[] = { -+ { -+ .name = "weight", -+ .read_u64 = bfqio_cgroup_weight_read, -+ .write_u64 = bfqio_cgroup_weight_write, -+ }, -+ { -+ .name = "ioprio", -+ .read_u64 = bfqio_cgroup_ioprio_read, -+ .write_u64 = bfqio_cgroup_ioprio_write, -+ }, -+ { -+ .name = "ioprio_class", -+ .read_u64 = bfqio_cgroup_ioprio_class_read, -+ .write_u64 = bfqio_cgroup_ioprio_class_write, -+ }, -+ { }, /* terminate */ -+}; -+ -+static struct cgroup_subsys_state *bfqio_create(struct cgroup_subsys_state -+ *parent_css) -+{ -+ struct bfqio_cgroup *bgrp; -+ -+ if (parent_css != NULL) { -+ bgrp = kzalloc(sizeof(*bgrp), GFP_KERNEL); -+ if (bgrp == NULL) -+ return ERR_PTR(-ENOMEM); -+ } else -+ bgrp = &bfqio_root_cgroup; -+ -+ spin_lock_init(&bgrp->lock); -+ INIT_HLIST_HEAD(&bgrp->group_data); -+ bgrp->ioprio = BFQ_DEFAULT_GRP_IOPRIO; -+ bgrp->ioprio_class = BFQ_DEFAULT_GRP_CLASS; -+ -+ return &bgrp->css; -+} -+ -+/* -+ * We cannot support shared io contexts, as we have no means to support -+ * two tasks with the same ioc in two different groups without major rework -+ * of the main bic/bfqq data structures. By now we allow a task to change -+ * its cgroup only if it's the only owner of its ioc; the drawback of this -+ * behavior is that a group containing a task that forked using CLONE_IO -+ * will not be destroyed until the tasks sharing the ioc die. -+ */ -+static int bfqio_can_attach(struct cgroup_subsys_state *css, -+ struct cgroup_taskset *tset) -+{ -+ struct task_struct *task; -+ struct io_context *ioc; -+ int ret = 0; -+ -+ cgroup_taskset_for_each(task, tset) { -+ /* -+ * task_lock() is needed to avoid races with -+ * exit_io_context() -+ */ -+ task_lock(task); -+ ioc = task->io_context; -+ if (ioc != NULL && atomic_read(&ioc->nr_tasks) > 1) -+ /* -+ * ioc == NULL means that the task is either too -+ * young or exiting: if it has still no ioc the -+ * ioc can't be shared, if the task is exiting the -+ * attach will fail anyway, no matter what we -+ * return here. -+ */ -+ ret = -EINVAL; -+ task_unlock(task); -+ if (ret) -+ break; -+ } -+ -+ return ret; -+} -+ -+static void bfqio_attach(struct cgroup_subsys_state *css, -+ struct cgroup_taskset *tset) -+{ -+ struct task_struct *task; -+ struct io_context *ioc; -+ struct io_cq *icq; -+ -+ /* -+ * IMPORTANT NOTE: The move of more than one process at a time to a -+ * new group has not yet been tested. -+ */ -+ cgroup_taskset_for_each(task, tset) { -+ ioc = get_task_io_context(task, GFP_ATOMIC, NUMA_NO_NODE); -+ if (ioc) { -+ /* -+ * Handle cgroup change here. 
-+ */ -+ rcu_read_lock(); -+ hlist_for_each_entry_rcu(icq, &ioc->icq_list, ioc_node) -+ if (!strncmp( -+ icq->q->elevator->type->elevator_name, -+ "bfq", ELV_NAME_MAX)) -+ bfq_bic_change_cgroup(icq_to_bic(icq), -+ css); -+ rcu_read_unlock(); -+ put_io_context(ioc); -+ } -+ } -+} -+ -+static void bfqio_destroy(struct cgroup_subsys_state *css) -+{ -+ struct bfqio_cgroup *bgrp = css_to_bfqio(css); -+ struct hlist_node *tmp; -+ struct bfq_group *bfqg; -+ -+ /* -+ * Since we are destroying the cgroup, there are no more tasks -+ * referencing it, and all the RCU grace periods that may have -+ * referenced it are ended (as the destruction of the parent -+ * cgroup is RCU-safe); bgrp->group_data will not be accessed by -+ * anything else and we don't need any synchronization. -+ */ -+ hlist_for_each_entry_safe(bfqg, tmp, &bgrp->group_data, group_node) -+ bfq_destroy_group(bgrp, bfqg); -+ -+ BUG_ON(!hlist_empty(&bgrp->group_data)); -+ -+ kfree(bgrp); -+} -+ -+static int bfqio_css_online(struct cgroup_subsys_state *css) -+{ -+ struct bfqio_cgroup *bgrp = css_to_bfqio(css); -+ -+ mutex_lock(&bfqio_mutex); -+ bgrp->online = true; -+ mutex_unlock(&bfqio_mutex); -+ -+ return 0; -+} -+ -+static void bfqio_css_offline(struct cgroup_subsys_state *css) -+{ -+ struct bfqio_cgroup *bgrp = css_to_bfqio(css); -+ -+ mutex_lock(&bfqio_mutex); -+ bgrp->online = false; -+ mutex_unlock(&bfqio_mutex); -+} -+ -+struct cgroup_subsys bfqio_cgrp_subsys = { -+ .css_alloc = bfqio_create, -+ .css_online = bfqio_css_online, -+ .css_offline = bfqio_css_offline, -+ .can_attach = bfqio_can_attach, -+ .attach = bfqio_attach, -+ .css_free = bfqio_destroy, -+ .legacy_cftypes = bfqio_files, -+}; -+#else -+static inline void bfq_init_entity(struct bfq_entity *entity, -+ struct bfq_group *bfqg) -+{ -+ entity->weight = entity->new_weight; -+ entity->orig_weight = entity->new_weight; -+ entity->ioprio = entity->new_ioprio; -+ entity->ioprio_class = entity->new_ioprio_class; -+ entity->sched_data = &bfqg->sched_data; -+} -+ -+static inline struct bfq_group * -+bfq_bic_update_cgroup(struct bfq_io_cq *bic) -+{ -+ struct bfq_data *bfqd = bic_to_bfqd(bic); -+ return bfqd->root_group; -+} -+ -+static inline void bfq_bfqq_move(struct bfq_data *bfqd, -+ struct bfq_queue *bfqq, -+ struct bfq_entity *entity, -+ struct bfq_group *bfqg) -+{ -+} -+ -+static void bfq_end_wr_async(struct bfq_data *bfqd) -+{ -+ bfq_end_wr_async_queues(bfqd, bfqd->root_group); -+} -+ -+static inline void bfq_disconnect_groups(struct bfq_data *bfqd) -+{ -+ bfq_put_async_queues(bfqd, bfqd->root_group); -+} -+ -+static inline void bfq_free_root_group(struct bfq_data *bfqd) -+{ -+ kfree(bfqd->root_group); -+} -+ -+static struct bfq_group *bfq_alloc_root_group(struct bfq_data *bfqd, int node) -+{ -+ struct bfq_group *bfqg; -+ int i; -+ -+ bfqg = kmalloc_node(sizeof(*bfqg), GFP_KERNEL | __GFP_ZERO, node); -+ if (bfqg == NULL) -+ return NULL; -+ -+ for (i = 0; i < BFQ_IOPRIO_CLASSES; i++) -+ bfqg->sched_data.service_tree[i] = BFQ_SERVICE_TREE_INIT; -+ -+ return bfqg; -+} -+#endif -diff -Nur linux-4.1.3/block/bfq.h linux-xbian-imx6/block/bfq.h ---- linux-4.1.3/block/bfq.h 1970-01-01 01:00:00.000000000 +0100 -+++ linux-xbian-imx6/block/bfq.h 2015-07-27 23:13:03.604123194 +0200 -@@ -0,0 +1,811 @@ -+/* -+ * BFQ-v7r7 for 4.0.0: data structures and common functions prototypes. 
-+ * -+ * Based on ideas and code from CFQ: -+ * Copyright (C) 2003 Jens Axboe -+ * -+ * Copyright (C) 2008 Fabio Checconi -+ * Paolo Valente -+ * -+ * Copyright (C) 2010 Paolo Valente -+ */ -+ -+#ifndef _BFQ_H -+#define _BFQ_H -+ -+#include -+#include -+#include -+#include -+ -+#define BFQ_IOPRIO_CLASSES 3 -+#define BFQ_CL_IDLE_TIMEOUT (HZ/5) -+ -+#define BFQ_MIN_WEIGHT 1 -+#define BFQ_MAX_WEIGHT 1000 -+ -+#define BFQ_DEFAULT_QUEUE_IOPRIO 4 -+ -+#define BFQ_DEFAULT_GRP_WEIGHT 10 -+#define BFQ_DEFAULT_GRP_IOPRIO 0 -+#define BFQ_DEFAULT_GRP_CLASS IOPRIO_CLASS_BE -+ -+struct bfq_entity; -+ -+/** -+ * struct bfq_service_tree - per ioprio_class service tree. -+ * @active: tree for active entities (i.e., those backlogged). -+ * @idle: tree for idle entities (i.e., those not backlogged, with V <= F_i). -+ * @first_idle: idle entity with minimum F_i. -+ * @last_idle: idle entity with maximum F_i. -+ * @vtime: scheduler virtual time. -+ * @wsum: scheduler weight sum; active and idle entities contribute to it. -+ * -+ * Each service tree represents a B-WF2Q+ scheduler on its own. Each -+ * ioprio_class has its own independent scheduler, and so its own -+ * bfq_service_tree. All the fields are protected by the queue lock -+ * of the containing bfqd. -+ */ -+struct bfq_service_tree { -+ struct rb_root active; -+ struct rb_root idle; -+ -+ struct bfq_entity *first_idle; -+ struct bfq_entity *last_idle; -+ -+ u64 vtime; -+ unsigned long wsum; -+}; -+ -+/** -+ * struct bfq_sched_data - multi-class scheduler. -+ * @in_service_entity: entity in service. -+ * @next_in_service: head-of-the-line entity in the scheduler. -+ * @service_tree: array of service trees, one per ioprio_class. -+ * -+ * bfq_sched_data is the basic scheduler queue. It supports three -+ * ioprio_classes, and can be used either as a toplevel queue or as -+ * an intermediate queue on a hierarchical setup. -+ * @next_in_service points to the active entity of the sched_data -+ * service trees that will be scheduled next. -+ * -+ * The supported ioprio_classes are the same as in CFQ, in descending -+ * priority order, IOPRIO_CLASS_RT, IOPRIO_CLASS_BE, IOPRIO_CLASS_IDLE. -+ * Requests from higher priority queues are served before all the -+ * requests from lower priority queues; among requests of the same -+ * queue requests are served according to B-WF2Q+. -+ * All the fields are protected by the queue lock of the containing bfqd. -+ */ -+struct bfq_sched_data { -+ struct bfq_entity *in_service_entity; -+ struct bfq_entity *next_in_service; -+ struct bfq_service_tree service_tree[BFQ_IOPRIO_CLASSES]; -+}; -+ -+/** -+ * struct bfq_weight_counter - counter of the number of all active entities -+ * with a given weight. -+ * @weight: weight of the entities that this counter refers to. -+ * @num_active: number of active entities with this weight. -+ * @weights_node: weights tree member (see bfq_data's @queue_weights_tree -+ * and @group_weights_tree). -+ */ -+struct bfq_weight_counter { -+ short int weight; -+ unsigned int num_active; -+ struct rb_node weights_node; -+}; -+ -+/** -+ * struct bfq_entity - schedulable entity. -+ * @rb_node: service_tree member. -+ * @weight_counter: pointer to the weight counter associated with this entity. -+ * @on_st: flag, true if the entity is on a tree (either the active or -+ * the idle one of its service_tree). -+ * @finish: B-WF2Q+ finish timestamp (aka F_i). -+ * @start: B-WF2Q+ start timestamp (aka S_i). -+ * @tree: tree the entity is enqueued into; %NULL if not on a tree. 
-+ * @min_start: minimum start time of the (active) subtree rooted at -+ * this entity; used for O(log N) lookups into active trees. -+ * @service: service received during the last round of service. -+ * @budget: budget used to calculate F_i; F_i = S_i + @budget / @weight. -+ * @weight: weight of the queue -+ * @parent: parent entity, for hierarchical scheduling. -+ * @my_sched_data: for non-leaf nodes in the cgroup hierarchy, the -+ * associated scheduler queue, %NULL on leaf nodes. -+ * @sched_data: the scheduler queue this entity belongs to. -+ * @ioprio: the ioprio in use. -+ * @new_weight: when a weight change is requested, the new weight value. -+ * @orig_weight: original weight, used to implement weight boosting -+ * @new_ioprio: when an ioprio change is requested, the new ioprio value. -+ * @ioprio_class: the ioprio_class in use. -+ * @new_ioprio_class: when an ioprio_class change is requested, the new -+ * ioprio_class value. -+ * @ioprio_changed: flag, true when the user requested a weight, ioprio or -+ * ioprio_class change. -+ * -+ * A bfq_entity is used to represent either a bfq_queue (leaf node in the -+ * cgroup hierarchy) or a bfq_group into the upper level scheduler. Each -+ * entity belongs to the sched_data of the parent group in the cgroup -+ * hierarchy. Non-leaf entities have also their own sched_data, stored -+ * in @my_sched_data. -+ * -+ * Each entity stores independently its priority values; this would -+ * allow different weights on different devices, but this -+ * functionality is not exported to userspace by now. Priorities and -+ * weights are updated lazily, first storing the new values into the -+ * new_* fields, then setting the @ioprio_changed flag. As soon as -+ * there is a transition in the entity state that allows the priority -+ * update to take place the effective and the requested priority -+ * values are synchronized. -+ * -+ * Unless cgroups are used, the weight value is calculated from the -+ * ioprio to export the same interface as CFQ. When dealing with -+ * ``well-behaved'' queues (i.e., queues that do not spend too much -+ * time to consume their budget and have true sequential behavior, and -+ * when there are no external factors breaking anticipation) the -+ * relative weights at each level of the cgroups hierarchy should be -+ * guaranteed. All the fields are protected by the queue lock of the -+ * containing bfqd. -+ */ -+struct bfq_entity { -+ struct rb_node rb_node; -+ struct bfq_weight_counter *weight_counter; -+ -+ int on_st; -+ -+ u64 finish; -+ u64 start; -+ -+ struct rb_root *tree; -+ -+ u64 min_start; -+ -+ unsigned long service, budget; -+ unsigned short weight, new_weight; -+ unsigned short orig_weight; -+ -+ struct bfq_entity *parent; -+ -+ struct bfq_sched_data *my_sched_data; -+ struct bfq_sched_data *sched_data; -+ -+ unsigned short ioprio, new_ioprio; -+ unsigned short ioprio_class, new_ioprio_class; -+ -+ int ioprio_changed; -+}; -+ -+struct bfq_group; -+ -+/** -+ * struct bfq_queue - leaf schedulable entity. -+ * @ref: reference counter. -+ * @bfqd: parent bfq_data. -+ * @new_bfqq: shared bfq_queue if queue is cooperating with -+ * one or more other queues. -+ * @pos_node: request-position tree member (see bfq_data's @rq_pos_tree). -+ * @pos_root: request-position tree root (see bfq_data's @rq_pos_tree). -+ * @sort_list: sorted list of pending requests. -+ * @next_rq: if fifo isn't expired, next request to serve. -+ * @queued: nr of requests queued in @sort_list. -+ * @allocated: currently allocated requests. 
-+ * @meta_pending: pending metadata requests. -+ * @fifo: fifo list of requests in sort_list. -+ * @entity: entity representing this queue in the scheduler. -+ * @max_budget: maximum budget allowed from the feedback mechanism. -+ * @budget_timeout: budget expiration (in jiffies). -+ * @dispatched: number of requests on the dispatch list or inside driver. -+ * @flags: status flags. -+ * @bfqq_list: node for active/idle bfqq list inside our bfqd. -+ * @burst_list_node: node for the device's burst list. -+ * @seek_samples: number of seeks sampled -+ * @seek_total: sum of the distances of the seeks sampled -+ * @seek_mean: mean seek distance -+ * @last_request_pos: position of the last request enqueued -+ * @requests_within_timer: number of consecutive pairs of request completion -+ * and arrival, such that the queue becomes idle -+ * after the completion, but the next request arrives -+ * within an idle time slice; used only if the queue's -+ * IO_bound has been cleared. -+ * @pid: pid of the process owning the queue, used for logging purposes. -+ * @last_wr_start_finish: start time of the current weight-raising period if -+ * the @bfq-queue is being weight-raised, otherwise -+ * finish time of the last weight-raising period -+ * @wr_cur_max_time: current max raising time for this queue -+ * @soft_rt_next_start: minimum time instant such that, only if a new -+ * request is enqueued after this time instant in an -+ * idle @bfq_queue with no outstanding requests, then -+ * the task associated with the queue it is deemed as -+ * soft real-time (see the comments to the function -+ * bfq_bfqq_softrt_next_start()) -+ * @last_idle_bklogged: time of the last transition of the @bfq_queue from -+ * idle to backlogged -+ * @service_from_backlogged: cumulative service received from the @bfq_queue -+ * since the last transition from idle to -+ * backlogged -+ * @bic: pointer to the bfq_io_cq owning the bfq_queue, set to %NULL if the -+ * queue is shared -+ * -+ * A bfq_queue is a leaf request queue; it can be associated with an -+ * io_context or more, if it is async or shared between cooperating -+ * processes. @cgroup holds a reference to the cgroup, to be sure that it -+ * does not disappear while a bfqq still references it (mostly to avoid -+ * races between request issuing and task migration followed by cgroup -+ * destruction). -+ * All the fields are protected by the queue lock of the containing bfqd. -+ */ -+struct bfq_queue { -+ atomic_t ref; -+ struct bfq_data *bfqd; -+ -+ /* fields for cooperating queues handling */ -+ struct bfq_queue *new_bfqq; -+ struct rb_node pos_node; -+ struct rb_root *pos_root; -+ -+ struct rb_root sort_list; -+ struct request *next_rq; -+ int queued[2]; -+ int allocated[2]; -+ int meta_pending; -+ struct list_head fifo; -+ -+ struct bfq_entity entity; -+ -+ unsigned long max_budget; -+ unsigned long budget_timeout; -+ -+ int dispatched; -+ -+ unsigned int flags; -+ -+ struct list_head bfqq_list; -+ -+ struct hlist_node burst_list_node; -+ -+ unsigned int seek_samples; -+ u64 seek_total; -+ sector_t seek_mean; -+ sector_t last_request_pos; -+ -+ unsigned int requests_within_timer; -+ -+ pid_t pid; -+ struct bfq_io_cq *bic; -+ -+ /* weight-raising fields */ -+ unsigned long wr_cur_max_time; -+ unsigned long soft_rt_next_start; -+ unsigned long last_wr_start_finish; -+ unsigned int wr_coeff; -+ unsigned long last_idle_bklogged; -+ unsigned long service_from_backlogged; -+}; -+ -+/** -+ * struct bfq_ttime - per process thinktime stats. 
-+ * @ttime_total: total process thinktime -+ * @ttime_samples: number of thinktime samples -+ * @ttime_mean: average process thinktime -+ */ -+struct bfq_ttime { -+ unsigned long last_end_request; -+ -+ unsigned long ttime_total; -+ unsigned long ttime_samples; -+ unsigned long ttime_mean; -+}; -+ -+/** -+ * struct bfq_io_cq - per (request_queue, io_context) structure. -+ * @icq: associated io_cq structure -+ * @bfqq: array of two process queues, the sync and the async -+ * @ttime: associated @bfq_ttime struct -+ * @wr_time_left: snapshot of the time left before weight raising ends -+ * for the sync queue associated to this process; this -+ * snapshot is taken to remember this value while the weight -+ * raising is suspended because the queue is merged with a -+ * shared queue, and is used to set @raising_cur_max_time -+ * when the queue is split from the shared queue and its -+ * weight is raised again -+ * @saved_idle_window: same purpose as the previous field for the idle -+ * window -+ * @saved_IO_bound: same purpose as the previous two fields for the I/O -+ * bound classification of a queue -+ * @saved_in_large_burst: same purpose as the previous fields for the -+ * value of the field keeping the queue's belonging -+ * to a large burst -+ * @was_in_burst_list: true if the queue belonged to a burst list -+ * before its merge with another cooperating queue -+ * @cooperations: counter of consecutive successful queue merges underwent -+ * by any of the process' @bfq_queues -+ * @failed_cooperations: counter of consecutive failed queue merges of any -+ * of the process' @bfq_queues -+ */ -+struct bfq_io_cq { -+ struct io_cq icq; /* must be the first member */ -+ struct bfq_queue *bfqq[2]; -+ struct bfq_ttime ttime; -+ int ioprio; -+ -+ unsigned int wr_time_left; -+ bool saved_idle_window; -+ bool saved_IO_bound; -+ -+ bool saved_in_large_burst; -+ bool was_in_burst_list; -+ -+ unsigned int cooperations; -+ unsigned int failed_cooperations; -+}; -+ -+enum bfq_device_speed { -+ BFQ_BFQD_FAST, -+ BFQ_BFQD_SLOW, -+}; -+ -+/** -+ * struct bfq_data - per device data structure. -+ * @queue: request queue for the managed device. -+ * @root_group: root bfq_group for the device. -+ * @rq_pos_tree: rbtree sorted by next_request position, used when -+ * determining if two or more queues have interleaving -+ * requests (see bfq_close_cooperator()). -+ * @active_numerous_groups: number of bfq_groups containing more than one -+ * active @bfq_entity. -+ * @queue_weights_tree: rbtree of weight counters of @bfq_queues, sorted by -+ * weight. Used to keep track of whether all @bfq_queues -+ * have the same weight. The tree contains one counter -+ * for each distinct weight associated to some active -+ * and not weight-raised @bfq_queue (see the comments to -+ * the functions bfq_weights_tree_[add|remove] for -+ * further details). -+ * @group_weights_tree: rbtree of non-queue @bfq_entity weight counters, sorted -+ * by weight. Used to keep track of whether all -+ * @bfq_groups have the same weight. The tree contains -+ * one counter for each distinct weight associated to -+ * some active @bfq_group (see the comments to the -+ * functions bfq_weights_tree_[add|remove] for further -+ * details). -+ * @busy_queues: number of bfq_queues containing requests (including the -+ * queue in service, even if it is idling). 
-+ * @busy_in_flight_queues: number of @bfq_queues containing pending or -+ * in-flight requests, plus the @bfq_queue in -+ * service, even if idle but waiting for the -+ * possible arrival of its next sync request. This -+ * field is updated only if the device is rotational, -+ * but used only if the device is also NCQ-capable. -+ * The reason why the field is updated also for non- -+ * NCQ-capable rotational devices is related to the -+ * fact that the value of @hw_tag may be set also -+ * later than when busy_in_flight_queues may need to -+ * be incremented for the first time(s). Taking also -+ * this possibility into account, to avoid unbalanced -+ * increments/decrements, would imply more overhead -+ * than just updating busy_in_flight_queues -+ * regardless of the value of @hw_tag. -+ * @const_seeky_busy_in_flight_queues: number of constantly-seeky @bfq_queues -+ * (that is, seeky queues that expired -+ * for budget timeout at least once) -+ * containing pending or in-flight -+ * requests, including the in-service -+ * @bfq_queue if constantly seeky. This -+ * field is updated only if the device -+ * is rotational, but used only if the -+ * device is also NCQ-capable (see the -+ * comments to @busy_in_flight_queues). -+ * @wr_busy_queues: number of weight-raised busy @bfq_queues. -+ * @queued: number of queued requests. -+ * @rq_in_driver: number of requests dispatched and waiting for completion. -+ * @sync_flight: number of sync requests in the driver. -+ * @max_rq_in_driver: max number of reqs in driver in the last -+ * @hw_tag_samples completed requests. -+ * @hw_tag_samples: nr of samples used to calculate hw_tag. -+ * @hw_tag: flag set to one if the driver is showing a queueing behavior. -+ * @budgets_assigned: number of budgets assigned. -+ * @idle_slice_timer: timer set when idling for the next sequential request -+ * from the queue in service. -+ * @unplug_work: delayed work to restart dispatching on the request queue. -+ * @in_service_queue: bfq_queue in service. -+ * @in_service_bic: bfq_io_cq (bic) associated with the @in_service_queue. -+ * @last_position: on-disk position of the last served request. -+ * @last_budget_start: beginning of the last budget. -+ * @last_idling_start: beginning of the last idle slice. -+ * @peak_rate: peak transfer rate observed for a budget. -+ * @peak_rate_samples: number of samples used to calculate @peak_rate. -+ * @bfq_max_budget: maximum budget allotted to a bfq_queue before -+ * rescheduling. -+ * @group_list: list of all the bfq_groups active on the device. -+ * @active_list: list of all the bfq_queues active on the device. -+ * @idle_list: list of all the bfq_queues idle on the device. -+ * @bfq_quantum: max number of requests dispatched per dispatch round. -+ * @bfq_fifo_expire: timeout for async/sync requests; when it expires -+ * requests are served in fifo order. -+ * @bfq_back_penalty: weight of backward seeks wrt forward ones. -+ * @bfq_back_max: maximum allowed backward seek. -+ * @bfq_slice_idle: maximum idling time. -+ * @bfq_user_max_budget: user-configured max budget value -+ * (0 for auto-tuning). -+ * @bfq_max_budget_async_rq: maximum budget (in nr of requests) allotted to -+ * async queues. 
-+ * @bfq_timeout: timeout for bfq_queues to consume their budget; used to -+ * to prevent seeky queues to impose long latencies to well -+ * behaved ones (this also implies that seeky queues cannot -+ * receive guarantees in the service domain; after a timeout -+ * they are charged for the whole allocated budget, to try -+ * to preserve a behavior reasonably fair among them, but -+ * without service-domain guarantees). -+ * @bfq_coop_thresh: number of queue merges after which a @bfq_queue is -+ * no more granted any weight-raising. -+ * @bfq_failed_cooperations: number of consecutive failed cooperation -+ * chances after which weight-raising is restored -+ * to a queue subject to more than bfq_coop_thresh -+ * queue merges. -+ * @bfq_requests_within_timer: number of consecutive requests that must be -+ * issued within the idle time slice to set -+ * again idling to a queue which was marked as -+ * non-I/O-bound (see the definition of the -+ * IO_bound flag for further details). -+ * @last_ins_in_burst: last time at which a queue entered the current -+ * burst of queues being activated shortly after -+ * each other; for more details about this and the -+ * following parameters related to a burst of -+ * activations, see the comments to the function -+ * @bfq_handle_burst. -+ * @bfq_burst_interval: reference time interval used to decide whether a -+ * queue has been activated shortly after -+ * @last_ins_in_burst. -+ * @burst_size: number of queues in the current burst of queue activations. -+ * @bfq_large_burst_thresh: maximum burst size above which the current -+ * queue-activation burst is deemed as 'large'. -+ * @large_burst: true if a large queue-activation burst is in progress. -+ * @burst_list: head of the burst list (as for the above fields, more details -+ * in the comments to the function bfq_handle_burst). -+ * @low_latency: if set to true, low-latency heuristics are enabled. -+ * @bfq_wr_coeff: maximum factor by which the weight of a weight-raised -+ * queue is multiplied. -+ * @bfq_wr_max_time: maximum duration of a weight-raising period (jiffies). -+ * @bfq_wr_rt_max_time: maximum duration for soft real-time processes. -+ * @bfq_wr_min_idle_time: minimum idle period after which weight-raising -+ * may be reactivated for a queue (in jiffies). -+ * @bfq_wr_min_inter_arr_async: minimum period between request arrivals -+ * after which weight-raising may be -+ * reactivated for an already busy queue -+ * (in jiffies). -+ * @bfq_wr_max_softrt_rate: max service-rate for a soft real-time queue, -+ * sectors per seconds. -+ * @RT_prod: cached value of the product R*T used for computing the maximum -+ * duration of the weight raising automatically. -+ * @device_speed: device-speed class for the low-latency heuristic. -+ * @oom_bfqq: fallback dummy bfqq for extreme OOM conditions. -+ * -+ * All the fields are protected by the @queue lock. 
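
The @RT_prod and @peak_rate pair is what drives the automatic sizing of the
interactive weight-raising period: the duration is RT_prod / peak_rate, i.e.
(R / r) * T as explained in the reference-parameter comments further below,
and bfq_wr_duration() performs exactly this division with do_div(). A minimal
user-space sketch of the computation, with purely hypothetical values for R,
T and the measured rate r (the driver keeps them in its own internal units):

#include <stdio.h>

int main(void)
{
	/* Hypothetical reference parameters, not the driver's values. */
	unsigned long long R = 10000;		/* reference peak rate */
	unsigned long long T = 6000;		/* reference load time */
	unsigned long long RT_prod = R * T;	/* cached once, like @RT_prod */

	/* Hypothetical measured peak rate of the device at hand. */
	unsigned long long r = 20000;

	/*
	 * duration = (R / r) * T: a device twice as fast as the reference
	 * one is granted half the weight-raising duration.
	 */
	printf("wr duration = %llu\n", RT_prod / r);	/* prints 3000 */
	return 0;
}
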
-+ */ -+struct bfq_data { -+ struct request_queue *queue; -+ -+ struct bfq_group *root_group; -+ struct rb_root rq_pos_tree; -+ -+#ifdef CONFIG_CGROUP_BFQIO -+ int active_numerous_groups; -+#endif -+ -+ struct rb_root queue_weights_tree; -+ struct rb_root group_weights_tree; -+ -+ int busy_queues; -+ int busy_in_flight_queues; -+ int const_seeky_busy_in_flight_queues; -+ int wr_busy_queues; -+ int queued; -+ int rq_in_driver; -+ int sync_flight; -+ -+ int max_rq_in_driver; -+ int hw_tag_samples; -+ int hw_tag; -+ -+ int budgets_assigned; -+ -+ struct timer_list idle_slice_timer; -+ struct work_struct unplug_work; -+ -+ struct bfq_queue *in_service_queue; -+ struct bfq_io_cq *in_service_bic; -+ -+ sector_t last_position; -+ -+ ktime_t last_budget_start; -+ ktime_t last_idling_start; -+ int peak_rate_samples; -+ u64 peak_rate; -+ unsigned long bfq_max_budget; -+ -+ struct hlist_head group_list; -+ struct list_head active_list; -+ struct list_head idle_list; -+ -+ unsigned int bfq_quantum; -+ unsigned int bfq_fifo_expire[2]; -+ unsigned int bfq_back_penalty; -+ unsigned int bfq_back_max; -+ unsigned int bfq_slice_idle; -+ u64 bfq_class_idle_last_service; -+ -+ unsigned int bfq_user_max_budget; -+ unsigned int bfq_max_budget_async_rq; -+ unsigned int bfq_timeout[2]; -+ -+ unsigned int bfq_coop_thresh; -+ unsigned int bfq_failed_cooperations; -+ unsigned int bfq_requests_within_timer; -+ -+ unsigned long last_ins_in_burst; -+ unsigned long bfq_burst_interval; -+ int burst_size; -+ unsigned long bfq_large_burst_thresh; -+ bool large_burst; -+ struct hlist_head burst_list; -+ -+ bool low_latency; -+ -+ /* parameters of the low_latency heuristics */ -+ unsigned int bfq_wr_coeff; -+ unsigned int bfq_wr_max_time; -+ unsigned int bfq_wr_rt_max_time; -+ unsigned int bfq_wr_min_idle_time; -+ unsigned long bfq_wr_min_inter_arr_async; -+ unsigned int bfq_wr_max_softrt_rate; -+ u64 RT_prod; -+ enum bfq_device_speed device_speed; -+ -+ struct bfq_queue oom_bfqq; -+}; -+ -+enum bfqq_state_flags { -+ BFQ_BFQQ_FLAG_busy = 0, /* has requests or is in service */ -+ BFQ_BFQQ_FLAG_wait_request, /* waiting for a request */ -+ BFQ_BFQQ_FLAG_must_alloc, /* must be allowed rq alloc */ -+ BFQ_BFQQ_FLAG_fifo_expire, /* FIFO checked in this slice */ -+ BFQ_BFQQ_FLAG_idle_window, /* slice idling enabled */ -+ BFQ_BFQQ_FLAG_prio_changed, /* task priority has changed */ -+ BFQ_BFQQ_FLAG_sync, /* synchronous queue */ -+ BFQ_BFQQ_FLAG_budget_new, /* no completion with this budget */ -+ BFQ_BFQQ_FLAG_IO_bound, /* -+ * bfqq has timed-out at least once -+ * having consumed at most 2/10 of -+ * its budget -+ */ -+ BFQ_BFQQ_FLAG_in_large_burst, /* -+ * bfqq activated in a large burst, -+ * see comments to bfq_handle_burst. 
-+ */ -+ BFQ_BFQQ_FLAG_constantly_seeky, /* -+ * bfqq has proved to be slow and -+ * seeky until budget timeout -+ */ -+ BFQ_BFQQ_FLAG_softrt_update, /* -+ * may need softrt-next-start -+ * update -+ */ -+ BFQ_BFQQ_FLAG_coop, /* bfqq is shared */ -+ BFQ_BFQQ_FLAG_split_coop, /* shared bfqq will be split */ -+ BFQ_BFQQ_FLAG_just_split, /* queue has just been split */ -+}; -+ -+#define BFQ_BFQQ_FNS(name) \ -+static inline void bfq_mark_bfqq_##name(struct bfq_queue *bfqq) \ -+{ \ -+ (bfqq)->flags |= (1 << BFQ_BFQQ_FLAG_##name); \ -+} \ -+static inline void bfq_clear_bfqq_##name(struct bfq_queue *bfqq) \ -+{ \ -+ (bfqq)->flags &= ~(1 << BFQ_BFQQ_FLAG_##name); \ -+} \ -+static inline int bfq_bfqq_##name(const struct bfq_queue *bfqq) \ -+{ \ -+ return ((bfqq)->flags & (1 << BFQ_BFQQ_FLAG_##name)) != 0; \ -+} -+ -+BFQ_BFQQ_FNS(busy); -+BFQ_BFQQ_FNS(wait_request); -+BFQ_BFQQ_FNS(must_alloc); -+BFQ_BFQQ_FNS(fifo_expire); -+BFQ_BFQQ_FNS(idle_window); -+BFQ_BFQQ_FNS(prio_changed); -+BFQ_BFQQ_FNS(sync); -+BFQ_BFQQ_FNS(budget_new); -+BFQ_BFQQ_FNS(IO_bound); -+BFQ_BFQQ_FNS(in_large_burst); -+BFQ_BFQQ_FNS(constantly_seeky); -+BFQ_BFQQ_FNS(coop); -+BFQ_BFQQ_FNS(split_coop); -+BFQ_BFQQ_FNS(just_split); -+BFQ_BFQQ_FNS(softrt_update); -+#undef BFQ_BFQQ_FNS -+ -+/* Logging facilities. */ -+#define bfq_log_bfqq(bfqd, bfqq, fmt, args...) \ -+ blk_add_trace_msg((bfqd)->queue, "bfq%d " fmt, (bfqq)->pid, ##args) -+ -+#define bfq_log(bfqd, fmt, args...) \ -+ blk_add_trace_msg((bfqd)->queue, "bfq " fmt, ##args) -+ -+/* Expiration reasons. */ -+enum bfqq_expiration { -+ BFQ_BFQQ_TOO_IDLE = 0, /* -+ * queue has been idling for -+ * too long -+ */ -+ BFQ_BFQQ_BUDGET_TIMEOUT, /* budget took too long to be used */ -+ BFQ_BFQQ_BUDGET_EXHAUSTED, /* budget consumed */ -+ BFQ_BFQQ_NO_MORE_REQUESTS, /* the queue has no more requests */ -+}; -+ -+#ifdef CONFIG_CGROUP_BFQIO -+/** -+ * struct bfq_group - per (device, cgroup) data structure. -+ * @entity: schedulable entity to insert into the parent group sched_data. -+ * @sched_data: own sched_data, to contain child entities (they may be -+ * both bfq_queues and bfq_groups). -+ * @group_node: node to be inserted into the bfqio_cgroup->group_data -+ * list of the containing cgroup's bfqio_cgroup. -+ * @bfqd_node: node to be inserted into the @bfqd->group_list list -+ * of the groups active on the same device; used for cleanup. -+ * @bfqd: the bfq_data for the device this group acts upon. -+ * @async_bfqq: array of async queues for all the tasks belonging to -+ * the group, one queue per ioprio value per ioprio_class, -+ * except for the idle class that has only one queue. -+ * @async_idle_bfqq: async queue for the idle class (ioprio is ignored). -+ * @my_entity: pointer to @entity, %NULL for the toplevel group; used -+ * to avoid too many special cases during group creation/ -+ * migration. -+ * @active_entities: number of active entities belonging to the group; -+ * unused for the root group. Used to know whether there -+ * are groups with more than one active @bfq_entity -+ * (see the comments to the function -+ * bfq_bfqq_must_not_expire()). -+ * -+ * Each (device, cgroup) pair has its own bfq_group, i.e., for each cgroup -+ * there is a set of bfq_groups, each one collecting the lower-level -+ * entities belonging to the group that are acting on the same device. -+ * -+ * Locking works as follows: -+ * o @group_node is protected by the bfqio_cgroup lock, and is accessed -+ * via RCU from its readers. 
-+ * o @bfqd is protected by the queue lock, RCU is used to access it -+ * from the readers. -+ * o All the other fields are protected by the @bfqd queue lock. -+ */ -+struct bfq_group { -+ struct bfq_entity entity; -+ struct bfq_sched_data sched_data; -+ -+ struct hlist_node group_node; -+ struct hlist_node bfqd_node; -+ -+ void *bfqd; -+ -+ struct bfq_queue *async_bfqq[2][IOPRIO_BE_NR]; -+ struct bfq_queue *async_idle_bfqq; -+ -+ struct bfq_entity *my_entity; -+ -+ int active_entities; -+}; -+ -+/** -+ * struct bfqio_cgroup - bfq cgroup data structure. -+ * @css: subsystem state for bfq in the containing cgroup. -+ * @online: flag marked when the subsystem is inserted. -+ * @weight: cgroup weight. -+ * @ioprio: cgroup ioprio. -+ * @ioprio_class: cgroup ioprio_class. -+ * @lock: spinlock that protects @ioprio, @ioprio_class and @group_data. -+ * @group_data: list containing the bfq_group belonging to this cgroup. -+ * -+ * @group_data is accessed using RCU, with @lock protecting the updates, -+ * @ioprio and @ioprio_class are protected by @lock. -+ */ -+struct bfqio_cgroup { -+ struct cgroup_subsys_state css; -+ bool online; -+ -+ unsigned short weight, ioprio, ioprio_class; -+ -+ spinlock_t lock; -+ struct hlist_head group_data; -+}; -+#else -+struct bfq_group { -+ struct bfq_sched_data sched_data; -+ -+ struct bfq_queue *async_bfqq[2][IOPRIO_BE_NR]; -+ struct bfq_queue *async_idle_bfqq; -+}; -+#endif -+ -+static inline struct bfq_service_tree * -+bfq_entity_service_tree(struct bfq_entity *entity) -+{ -+ struct bfq_sched_data *sched_data = entity->sched_data; -+ unsigned int idx = entity->ioprio_class - 1; -+ -+ BUG_ON(idx >= BFQ_IOPRIO_CLASSES); -+ BUG_ON(sched_data == NULL); -+ -+ return sched_data->service_tree + idx; -+} -+ -+static inline struct bfq_queue *bic_to_bfqq(struct bfq_io_cq *bic, -+ bool is_sync) -+{ -+ return bic->bfqq[is_sync]; -+} -+ -+static inline void bic_set_bfqq(struct bfq_io_cq *bic, -+ struct bfq_queue *bfqq, bool is_sync) -+{ -+ bic->bfqq[is_sync] = bfqq; -+} -+ -+static inline struct bfq_data *bic_to_bfqd(struct bfq_io_cq *bic) -+{ -+ return bic->icq.q->elevator->elevator_data; -+} -+ -+/** -+ * bfq_get_bfqd_locked - get a lock to a bfqd using a RCU protected pointer. -+ * @ptr: a pointer to a bfqd. -+ * @flags: storage for the flags to be saved. -+ * -+ * This function allows bfqg->bfqd to be protected by the -+ * queue lock of the bfqd they reference; the pointer is dereferenced -+ * under RCU, so the storage for bfqd is assured to be safe as long -+ * as the RCU read side critical section does not end. After the -+ * bfqd->queue->queue_lock is taken the pointer is rechecked, to be -+ * sure that no other writer accessed it. If we raced with a writer, -+ * the function returns NULL, with the queue unlocked, otherwise it -+ * returns the dereferenced pointer, with the queue locked. 
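
A hedged sketch of how a caller could pair this helper with
bfq_put_bfqd_unlock(), defined right after it; the function below is
hypothetical and assumes the CONFIG_CGROUP_BFQIO variant of struct bfq_group
(the one that carries a ->bfqd back-pointer), purely to show the NULL check
and the lock ownership that the comment above describes:

/* Hypothetical caller, for illustration only. */
static void example_bfqg_update(struct bfq_group *bfqg)
{
	unsigned long flags;
	struct bfq_data *bfqd;

	/* Dereference bfqg->bfqd under RCU, rechecked under the queue lock. */
	bfqd = bfq_get_bfqd_locked(&bfqg->bfqd, &flags);
	if (bfqd == NULL)
		return;	/* raced with a writer: the queue lock is NOT held */

	/* ... bfqd may be used here, bfqd->queue->queue_lock is held ... */

	bfq_put_bfqd_unlock(bfqd, &flags);
}
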
-+ */ -+static inline struct bfq_data *bfq_get_bfqd_locked(void **ptr, -+ unsigned long *flags) -+{ -+ struct bfq_data *bfqd; -+ -+ rcu_read_lock(); -+ bfqd = rcu_dereference(*(struct bfq_data **)ptr); -+ -+ if (bfqd != NULL) { -+ spin_lock_irqsave(bfqd->queue->queue_lock, *flags); -+ if (*ptr == bfqd) -+ goto out; -+ spin_unlock_irqrestore(bfqd->queue->queue_lock, *flags); -+ } -+ -+ bfqd = NULL; -+out: -+ rcu_read_unlock(); -+ return bfqd; -+} -+ -+static inline void bfq_put_bfqd_unlock(struct bfq_data *bfqd, -+ unsigned long *flags) -+{ -+ spin_unlock_irqrestore(bfqd->queue->queue_lock, *flags); -+} -+ -+static void bfq_changed_ioprio(struct bfq_io_cq *bic); -+static void bfq_put_queue(struct bfq_queue *bfqq); -+static void bfq_dispatch_insert(struct request_queue *q, struct request *rq); -+static struct bfq_queue *bfq_get_queue(struct bfq_data *bfqd, -+ struct bfq_group *bfqg, int is_sync, -+ struct bfq_io_cq *bic, gfp_t gfp_mask); -+static void bfq_end_wr_async_queues(struct bfq_data *bfqd, -+ struct bfq_group *bfqg); -+static void bfq_put_async_queues(struct bfq_data *bfqd, struct bfq_group *bfqg); -+static void bfq_exit_bfqq(struct bfq_data *bfqd, struct bfq_queue *bfqq); -+ -+#endif /* _BFQ_H */ -diff -Nur linux-4.1.3/block/bfq-ioc.c linux-xbian-imx6/block/bfq-ioc.c ---- linux-4.1.3/block/bfq-ioc.c 1970-01-01 01:00:00.000000000 +0100 -+++ linux-xbian-imx6/block/bfq-ioc.c 2015-07-27 23:13:03.600137415 +0200 -@@ -0,0 +1,36 @@ -+/* -+ * BFQ: I/O context handling. -+ * -+ * Based on ideas and code from CFQ: -+ * Copyright (C) 2003 Jens Axboe -+ * -+ * Copyright (C) 2008 Fabio Checconi -+ * Paolo Valente -+ * -+ * Copyright (C) 2010 Paolo Valente -+ */ -+ -+/** -+ * icq_to_bic - convert iocontext queue structure to bfq_io_cq. -+ * @icq: the iocontext queue. -+ */ -+static inline struct bfq_io_cq *icq_to_bic(struct io_cq *icq) -+{ -+ /* bic->icq is the first member, %NULL will convert to %NULL */ -+ return container_of(icq, struct bfq_io_cq, icq); -+} -+ -+/** -+ * bfq_bic_lookup - search into @ioc a bic associated to @bfqd. -+ * @bfqd: the lookup key. -+ * @ioc: the io_context of the process doing I/O. -+ * -+ * Queue lock must be held. -+ */ -+static inline struct bfq_io_cq *bfq_bic_lookup(struct bfq_data *bfqd, -+ struct io_context *ioc) -+{ -+ if (ioc) -+ return icq_to_bic(ioc_lookup_icq(ioc, bfqd->queue)); -+ return NULL; -+} -diff -Nur linux-4.1.3/block/bfq-iosched.c linux-xbian-imx6/block/bfq-iosched.c ---- linux-4.1.3/block/bfq-iosched.c 1970-01-01 01:00:00.000000000 +0100 -+++ linux-xbian-imx6/block/bfq-iosched.c 2015-07-27 23:13:03.600137415 +0200 -@@ -0,0 +1,4223 @@ -+/* -+ * Budget Fair Queueing (BFQ) disk scheduler. -+ * -+ * Based on ideas and code from CFQ: -+ * Copyright (C) 2003 Jens Axboe -+ * -+ * Copyright (C) 2008 Fabio Checconi -+ * Paolo Valente -+ * -+ * Copyright (C) 2010 Paolo Valente -+ * -+ * Licensed under the GPL-2 as detailed in the accompanying COPYING.BFQ -+ * file. -+ * -+ * BFQ is a proportional-share storage-I/O scheduling algorithm based on -+ * the slice-by-slice service scheme of CFQ. But BFQ assigns budgets, -+ * measured in number of sectors, to processes instead of time slices. The -+ * device is not granted to the in-service process for a given time slice, -+ * but until it has exhausted its assigned budget. This change from the time -+ * to the service domain allows BFQ to distribute the device throughput -+ * among processes as desired, without any distortion due to ZBR, workload -+ * fluctuations or other factors. 
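
To make the service-domain argument concrete with made-up figures: on a drive
whose outer zones sustain 150 MB/s and whose inner zones sustain 75 MB/s,

	150 MB/s x 0.100 s = 15 MB    vs.    75 MB/s x 0.100 s = 7.5 MB

so equal 100 ms time slices hand out a 2:1 throughput skew that the scheduler
never asked for, whereas equal budgets of, say, 16384 sectors (8 MiB) are
worth the same amount of data in either zone; the inner-zone reader simply
holds the device longer and the intended 1:1 distribution is preserved.
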
BFQ uses an ad hoc internal scheduler, -+ * called B-WF2Q+, to schedule processes according to their budgets. More -+ * precisely, BFQ schedules queues associated to processes. Thanks to the -+ * accurate policy of B-WF2Q+, BFQ can afford to assign high budgets to -+ * I/O-bound processes issuing sequential requests (to boost the -+ * throughput), and yet guarantee a low latency to interactive and soft -+ * real-time applications. -+ * -+ * BFQ is described in [1], where also a reference to the initial, more -+ * theoretical paper on BFQ can be found. The interested reader can find -+ * in the latter paper full details on the main algorithm, as well as -+ * formulas of the guarantees and formal proofs of all the properties. -+ * With respect to the version of BFQ presented in these papers, this -+ * implementation adds a few more heuristics, such as the one that -+ * guarantees a low latency to soft real-time applications, and a -+ * hierarchical extension based on H-WF2Q+. -+ * -+ * B-WF2Q+ is based on WF2Q+, that is described in [2], together with -+ * H-WF2Q+, while the augmented tree used to implement B-WF2Q+ with O(log N) -+ * complexity derives from the one introduced with EEVDF in [3]. -+ * -+ * [1] P. Valente and M. Andreolini, ``Improving Application Responsiveness -+ * with the BFQ Disk I/O Scheduler'', -+ * Proceedings of the 5th Annual International Systems and Storage -+ * Conference (SYSTOR '12), June 2012. -+ * -+ * http://algogroup.unimo.it/people/paolo/disk_sched/bf1-v1-suite-results.pdf -+ * -+ * [2] Jon C.R. Bennett and H. Zhang, ``Hierarchical Packet Fair Queueing -+ * Algorithms,'' IEEE/ACM Transactions on Networking, 5(5):675-689, -+ * Oct 1997. -+ * -+ * http://www.cs.cmu.edu/~hzhang/papers/TON-97-Oct.ps.gz -+ * -+ * [3] I. Stoica and H. Abdel-Wahab, ``Earliest Eligible Virtual Deadline -+ * First: A Flexible and Accurate Mechanism for Proportional Share -+ * Resource Allocation,'' technical report. -+ * -+ * http://www.cs.berkeley.edu/~istoica/papers/eevdf-tr-95.pdf -+ */ -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include "bfq.h" -+#include "blk.h" -+ -+/* Max number of dispatches in one round of service. */ -+static const int bfq_quantum = 4; -+ -+/* Expiration time of sync (0) and async (1) requests, in jiffies. */ -+static const int bfq_fifo_expire[2] = { HZ / 4, HZ / 8 }; -+ -+/* Maximum backwards seek, in KiB. */ -+static const int bfq_back_max = 16 * 1024; -+ -+/* Penalty of a backwards seek, in number of sectors. */ -+static const int bfq_back_penalty = 2; -+ -+/* Idling period duration, in jiffies. */ -+static int bfq_slice_idle = HZ / 125; -+ -+/* Default maximum budget values, in sectors and number of requests. */ -+static const int bfq_default_max_budget = 16 * 1024; -+static const int bfq_max_budget_async_rq = 4; -+ -+/* -+ * Async to sync throughput distribution is controlled as follows: -+ * when an async request is served, the entity is charged the number -+ * of sectors of the request, multiplied by the factor below -+ */ -+static const int bfq_async_charge_factor = 10; -+ -+/* Default timeout values, in jiffies, approximating CFQ defaults. */ -+static const int bfq_timeout_sync = HZ / 8; -+static int bfq_timeout_async = HZ / 25; -+ -+struct kmem_cache *bfq_pool; -+ -+/* Below this threshold (in ms), we consider thinktime immediate. */ -+#define BFQ_MIN_TT 2 -+ -+/* hw_tag detection: parallel requests threshold and min samples needed. 
*/ -+#define BFQ_HW_QUEUE_THRESHOLD 4 -+#define BFQ_HW_QUEUE_SAMPLES 32 -+ -+#define BFQQ_SEEK_THR (sector_t)(8 * 1024) -+#define BFQQ_SEEKY(bfqq) ((bfqq)->seek_mean > BFQQ_SEEK_THR) -+ -+/* Min samples used for peak rate estimation (for autotuning). */ -+#define BFQ_PEAK_RATE_SAMPLES 32 -+ -+/* Shift used for peak rate fixed precision calculations. */ -+#define BFQ_RATE_SHIFT 16 -+ -+/* -+ * By default, BFQ computes the duration of the weight raising for -+ * interactive applications automatically, using the following formula: -+ * duration = (R / r) * T, where r is the peak rate of the device, and -+ * R and T are two reference parameters. -+ * In particular, R is the peak rate of the reference device (see below), -+ * and T is a reference time: given the systems that are likely to be -+ * installed on the reference device according to its speed class, T is -+ * about the maximum time needed, under BFQ and while reading two files in -+ * parallel, to load typical large applications on these systems. -+ * In practice, the slower/faster the device at hand is, the more/less it -+ * takes to load applications with respect to the reference device. -+ * Accordingly, the longer/shorter BFQ grants weight raising to interactive -+ * applications. -+ * -+ * BFQ uses four different reference pairs (R, T), depending on: -+ * . whether the device is rotational or non-rotational; -+ * . whether the device is slow, such as old or portable HDDs, as well as -+ * SD cards, or fast, such as newer HDDs and SSDs. -+ * -+ * The device's speed class is dynamically (re)detected in -+ * bfq_update_peak_rate() every time the estimated peak rate is updated. -+ * -+ * In the following definitions, R_slow[0]/R_fast[0] and T_slow[0]/T_fast[0] -+ * are the reference values for a slow/fast rotational device, whereas -+ * R_slow[1]/R_fast[1] and T_slow[1]/T_fast[1] are the reference values for -+ * a slow/fast non-rotational device. Finally, device_speed_thresh are the -+ * thresholds used to switch between speed classes. -+ * Both the reference peak rates and the thresholds are measured in -+ * sectors/usec, left-shifted by BFQ_RATE_SHIFT. -+ */ -+static int R_slow[2] = {1536, 10752}; -+static int R_fast[2] = {17415, 34791}; -+/* -+ * To improve readability, a conversion function is used to initialize the -+ * following arrays, which entails that they can be initialized only in a -+ * function. -+ */ -+static int T_slow[2]; -+static int T_fast[2]; -+static int device_speed_thresh[2]; -+ -+#define BFQ_SERVICE_TREE_INIT ((struct bfq_service_tree) \ -+ { RB_ROOT, RB_ROOT, NULL, NULL, 0, 0 }) -+ -+#define RQ_BIC(rq) ((struct bfq_io_cq *) (rq)->elv.priv[0]) -+#define RQ_BFQQ(rq) ((rq)->elv.priv[1]) -+ -+static inline void bfq_schedule_dispatch(struct bfq_data *bfqd); -+ -+#include "bfq-ioc.c" -+#include "bfq-sched.c" -+#include "bfq-cgroup.c" -+ -+#define bfq_class_idle(bfqq) ((bfqq)->entity.ioprio_class ==\ -+ IOPRIO_CLASS_IDLE) -+#define bfq_class_rt(bfqq) ((bfqq)->entity.ioprio_class ==\ -+ IOPRIO_CLASS_RT) -+ -+#define bfq_sample_valid(samples) ((samples) > 80) -+ -+/* -+ * We regard a request as SYNC, if either it's a read or has the SYNC bit -+ * set (in which case it could also be a direct WRITE). -+ */ -+static inline int bfq_bio_sync(struct bio *bio) -+{ -+ if (bio_data_dir(bio) == READ || (bio->bi_rw & REQ_SYNC)) -+ return 1; -+ -+ return 0; -+} -+ -+/* -+ * Scheduler run of queue, if there are requests pending and no one in the -+ * driver that will restart queueing. 
-+ */ -+static inline void bfq_schedule_dispatch(struct bfq_data *bfqd) -+{ -+ if (bfqd->queued != 0) { -+ bfq_log(bfqd, "schedule dispatch"); -+ kblockd_schedule_work(&bfqd->unplug_work); -+ } -+} -+ -+/* -+ * Lifted from AS - choose which of rq1 and rq2 that is best served now. -+ * We choose the request that is closesr to the head right now. Distance -+ * behind the head is penalized and only allowed to a certain extent. -+ */ -+static struct request *bfq_choose_req(struct bfq_data *bfqd, -+ struct request *rq1, -+ struct request *rq2, -+ sector_t last) -+{ -+ sector_t s1, s2, d1 = 0, d2 = 0; -+ unsigned long back_max; -+#define BFQ_RQ1_WRAP 0x01 /* request 1 wraps */ -+#define BFQ_RQ2_WRAP 0x02 /* request 2 wraps */ -+ unsigned wrap = 0; /* bit mask: requests behind the disk head? */ -+ -+ if (rq1 == NULL || rq1 == rq2) -+ return rq2; -+ if (rq2 == NULL) -+ return rq1; -+ -+ if (rq_is_sync(rq1) && !rq_is_sync(rq2)) -+ return rq1; -+ else if (rq_is_sync(rq2) && !rq_is_sync(rq1)) -+ return rq2; -+ if ((rq1->cmd_flags & REQ_META) && !(rq2->cmd_flags & REQ_META)) -+ return rq1; -+ else if ((rq2->cmd_flags & REQ_META) && !(rq1->cmd_flags & REQ_META)) -+ return rq2; -+ -+ s1 = blk_rq_pos(rq1); -+ s2 = blk_rq_pos(rq2); -+ -+ /* -+ * By definition, 1KiB is 2 sectors. -+ */ -+ back_max = bfqd->bfq_back_max * 2; -+ -+ /* -+ * Strict one way elevator _except_ in the case where we allow -+ * short backward seeks which are biased as twice the cost of a -+ * similar forward seek. -+ */ -+ if (s1 >= last) -+ d1 = s1 - last; -+ else if (s1 + back_max >= last) -+ d1 = (last - s1) * bfqd->bfq_back_penalty; -+ else -+ wrap |= BFQ_RQ1_WRAP; -+ -+ if (s2 >= last) -+ d2 = s2 - last; -+ else if (s2 + back_max >= last) -+ d2 = (last - s2) * bfqd->bfq_back_penalty; -+ else -+ wrap |= BFQ_RQ2_WRAP; -+ -+ /* Found required data */ -+ -+ /* -+ * By doing switch() on the bit mask "wrap" we avoid having to -+ * check two variables for all permutations: --> faster! -+ */ -+ switch (wrap) { -+ case 0: /* common case for CFQ: rq1 and rq2 not wrapped */ -+ if (d1 < d2) -+ return rq1; -+ else if (d2 < d1) -+ return rq2; -+ else { -+ if (s1 >= s2) -+ return rq1; -+ else -+ return rq2; -+ } -+ -+ case BFQ_RQ2_WRAP: -+ return rq1; -+ case BFQ_RQ1_WRAP: -+ return rq2; -+ case (BFQ_RQ1_WRAP|BFQ_RQ2_WRAP): /* both rqs wrapped */ -+ default: -+ /* -+ * Since both rqs are wrapped, -+ * start with the one that's further behind head -+ * (--> only *one* back seek required), -+ * since back seek takes more time than forward. -+ */ -+ if (s1 <= s2) -+ return rq1; -+ else -+ return rq2; -+ } -+} -+ -+static struct bfq_queue * -+bfq_rq_pos_tree_lookup(struct bfq_data *bfqd, struct rb_root *root, -+ sector_t sector, struct rb_node **ret_parent, -+ struct rb_node ***rb_link) -+{ -+ struct rb_node **p, *parent; -+ struct bfq_queue *bfqq = NULL; -+ -+ parent = NULL; -+ p = &root->rb_node; -+ while (*p) { -+ struct rb_node **n; -+ -+ parent = *p; -+ bfqq = rb_entry(parent, struct bfq_queue, pos_node); -+ -+ /* -+ * Sort strictly based on sector. Smallest to the left, -+ * largest to the right. -+ */ -+ if (sector > blk_rq_pos(bfqq->next_rq)) -+ n = &(*p)->rb_right; -+ else if (sector < blk_rq_pos(bfqq->next_rq)) -+ n = &(*p)->rb_left; -+ else -+ break; -+ p = n; -+ bfqq = NULL; -+ } -+ -+ *ret_parent = parent; -+ if (rb_link) -+ *rb_link = p; -+ -+ bfq_log(bfqd, "rq_pos_tree_lookup %llu: returning %d", -+ (long long unsigned)sector, -+ bfqq != NULL ? 
bfqq->pid : 0); -+ -+ return bfqq; -+} -+ -+static void bfq_rq_pos_tree_add(struct bfq_data *bfqd, struct bfq_queue *bfqq) -+{ -+ struct rb_node **p, *parent; -+ struct bfq_queue *__bfqq; -+ -+ if (bfqq->pos_root != NULL) { -+ rb_erase(&bfqq->pos_node, bfqq->pos_root); -+ bfqq->pos_root = NULL; -+ } -+ -+ if (bfq_class_idle(bfqq)) -+ return; -+ if (!bfqq->next_rq) -+ return; -+ -+ bfqq->pos_root = &bfqd->rq_pos_tree; -+ __bfqq = bfq_rq_pos_tree_lookup(bfqd, bfqq->pos_root, -+ blk_rq_pos(bfqq->next_rq), &parent, &p); -+ if (__bfqq == NULL) { -+ rb_link_node(&bfqq->pos_node, parent, p); -+ rb_insert_color(&bfqq->pos_node, bfqq->pos_root); -+ } else -+ bfqq->pos_root = NULL; -+} -+ -+/* -+ * Tell whether there are active queues or groups with differentiated weights. -+ */ -+static inline bool bfq_differentiated_weights(struct bfq_data *bfqd) -+{ -+ BUG_ON(!bfqd->hw_tag); -+ /* -+ * For weights to differ, at least one of the trees must contain -+ * at least two nodes. -+ */ -+ return (!RB_EMPTY_ROOT(&bfqd->queue_weights_tree) && -+ (bfqd->queue_weights_tree.rb_node->rb_left || -+ bfqd->queue_weights_tree.rb_node->rb_right) -+#ifdef CONFIG_CGROUP_BFQIO -+ ) || -+ (!RB_EMPTY_ROOT(&bfqd->group_weights_tree) && -+ (bfqd->group_weights_tree.rb_node->rb_left || -+ bfqd->group_weights_tree.rb_node->rb_right) -+#endif -+ ); -+} -+ -+/* -+ * If the weight-counter tree passed as input contains no counter for -+ * the weight of the input entity, then add that counter; otherwise just -+ * increment the existing counter. -+ * -+ * Note that weight-counter trees contain few nodes in mostly symmetric -+ * scenarios. For example, if all queues have the same weight, then the -+ * weight-counter tree for the queues may contain at most one node. -+ * This holds even if low_latency is on, because weight-raised queues -+ * are not inserted in the tree. -+ * In most scenarios, the rate at which nodes are created/destroyed -+ * should be low too. -+ */ -+static void bfq_weights_tree_add(struct bfq_data *bfqd, -+ struct bfq_entity *entity, -+ struct rb_root *root) -+{ -+ struct rb_node **new = &(root->rb_node), *parent = NULL; -+ -+ /* -+ * Do not insert if: -+ * - the device does not support queueing; -+ * - the entity is already associated with a counter, which happens if: -+ * 1) the entity is associated with a queue, 2) a request arrival -+ * has caused the queue to become both non-weight-raised, and hence -+ * change its weight, and backlogged; in this respect, each -+ * of the two events causes an invocation of this function, -+ * 3) this is the invocation of this function caused by the second -+ * event. This second invocation is actually useless, and we handle -+ * this fact by exiting immediately. More efficient or clearer -+ * solutions might possibly be adopted. 
-+ */ -+ if (!bfqd->hw_tag || entity->weight_counter) -+ return; -+ -+ while (*new) { -+ struct bfq_weight_counter *__counter = container_of(*new, -+ struct bfq_weight_counter, -+ weights_node); -+ parent = *new; -+ -+ if (entity->weight == __counter->weight) { -+ entity->weight_counter = __counter; -+ goto inc_counter; -+ } -+ if (entity->weight < __counter->weight) -+ new = &((*new)->rb_left); -+ else -+ new = &((*new)->rb_right); -+ } -+ -+ entity->weight_counter = kzalloc(sizeof(struct bfq_weight_counter), -+ GFP_ATOMIC); -+ entity->weight_counter->weight = entity->weight; -+ rb_link_node(&entity->weight_counter->weights_node, parent, new); -+ rb_insert_color(&entity->weight_counter->weights_node, root); -+ -+inc_counter: -+ entity->weight_counter->num_active++; -+} -+ -+/* -+ * Decrement the weight counter associated with the entity, and, if the -+ * counter reaches 0, remove the counter from the tree. -+ * See the comments to the function bfq_weights_tree_add() for considerations -+ * about overhead. -+ */ -+static void bfq_weights_tree_remove(struct bfq_data *bfqd, -+ struct bfq_entity *entity, -+ struct rb_root *root) -+{ -+ /* -+ * Check whether the entity is actually associated with a counter. -+ * In fact, the device may not be considered NCQ-capable for a while, -+ * which implies that no insertion in the weight trees is performed, -+ * after which the device may start to be deemed NCQ-capable, and hence -+ * this function may start to be invoked. This may cause the function -+ * to be invoked for entities that are not associated with any counter. -+ */ -+ if (!entity->weight_counter) -+ return; -+ -+ BUG_ON(RB_EMPTY_ROOT(root)); -+ BUG_ON(entity->weight_counter->weight != entity->weight); -+ -+ BUG_ON(!entity->weight_counter->num_active); -+ entity->weight_counter->num_active--; -+ if (entity->weight_counter->num_active > 0) -+ goto reset_entity_pointer; -+ -+ rb_erase(&entity->weight_counter->weights_node, root); -+ kfree(entity->weight_counter); -+ -+reset_entity_pointer: -+ entity->weight_counter = NULL; -+} -+ -+static struct request *bfq_find_next_rq(struct bfq_data *bfqd, -+ struct bfq_queue *bfqq, -+ struct request *last) -+{ -+ struct rb_node *rbnext = rb_next(&last->rb_node); -+ struct rb_node *rbprev = rb_prev(&last->rb_node); -+ struct request *next = NULL, *prev = NULL; -+ -+ BUG_ON(RB_EMPTY_NODE(&last->rb_node)); -+ -+ if (rbprev != NULL) -+ prev = rb_entry_rq(rbprev); -+ -+ if (rbnext != NULL) -+ next = rb_entry_rq(rbnext); -+ else { -+ rbnext = rb_first(&bfqq->sort_list); -+ if (rbnext && rbnext != &last->rb_node) -+ next = rb_entry_rq(rbnext); -+ } -+ -+ return bfq_choose_req(bfqd, next, prev, blk_rq_pos(last)); -+} -+ -+/* see the definition of bfq_async_charge_factor for details */ -+static inline unsigned long bfq_serv_to_charge(struct request *rq, -+ struct bfq_queue *bfqq) -+{ -+ return blk_rq_sectors(rq) * -+ (1 + ((!bfq_bfqq_sync(bfqq)) * (bfqq->wr_coeff == 1) * -+ bfq_async_charge_factor)); -+} -+ -+/** -+ * bfq_updated_next_req - update the queue after a new next_rq selection. -+ * @bfqd: the device data the queue belongs to. -+ * @bfqq: the queue to update. -+ * -+ * If the first request of a queue changes we make sure that the queue -+ * has enough budget to serve at least its first request (if the -+ * request has grown). We do this because if the queue has not enough -+ * budget for its first request, it has to go through two dispatch -+ * rounds to actually get it dispatched. 
-+ */ -+static void bfq_updated_next_req(struct bfq_data *bfqd, -+ struct bfq_queue *bfqq) -+{ -+ struct bfq_entity *entity = &bfqq->entity; -+ struct bfq_service_tree *st = bfq_entity_service_tree(entity); -+ struct request *next_rq = bfqq->next_rq; -+ unsigned long new_budget; -+ -+ if (next_rq == NULL) -+ return; -+ -+ if (bfqq == bfqd->in_service_queue) -+ /* -+ * In order not to break guarantees, budgets cannot be -+ * changed after an entity has been selected. -+ */ -+ return; -+ -+ BUG_ON(entity->tree != &st->active); -+ BUG_ON(entity == entity->sched_data->in_service_entity); -+ -+ new_budget = max_t(unsigned long, bfqq->max_budget, -+ bfq_serv_to_charge(next_rq, bfqq)); -+ if (entity->budget != new_budget) { -+ entity->budget = new_budget; -+ bfq_log_bfqq(bfqd, bfqq, "updated next rq: new budget %lu", -+ new_budget); -+ bfq_activate_bfqq(bfqd, bfqq); -+ } -+} -+ -+static inline unsigned int bfq_wr_duration(struct bfq_data *bfqd) -+{ -+ u64 dur; -+ -+ if (bfqd->bfq_wr_max_time > 0) -+ return bfqd->bfq_wr_max_time; -+ -+ dur = bfqd->RT_prod; -+ do_div(dur, bfqd->peak_rate); -+ -+ return dur; -+} -+ -+static inline unsigned -+bfq_bfqq_cooperations(struct bfq_queue *bfqq) -+{ -+ return bfqq->bic ? bfqq->bic->cooperations : 0; -+} -+ -+static inline void -+bfq_bfqq_resume_state(struct bfq_queue *bfqq, struct bfq_io_cq *bic) -+{ -+ if (bic->saved_idle_window) -+ bfq_mark_bfqq_idle_window(bfqq); -+ else -+ bfq_clear_bfqq_idle_window(bfqq); -+ if (bic->saved_IO_bound) -+ bfq_mark_bfqq_IO_bound(bfqq); -+ else -+ bfq_clear_bfqq_IO_bound(bfqq); -+ /* Assuming that the flag in_large_burst is already correctly set */ -+ if (bic->wr_time_left && bfqq->bfqd->low_latency && -+ !bfq_bfqq_in_large_burst(bfqq) && -+ bic->cooperations < bfqq->bfqd->bfq_coop_thresh) { -+ /* -+ * Start a weight raising period with the duration given by -+ * the raising_time_left snapshot. -+ */ -+ if (bfq_bfqq_busy(bfqq)) -+ bfqq->bfqd->wr_busy_queues++; -+ bfqq->wr_coeff = bfqq->bfqd->bfq_wr_coeff; -+ bfqq->wr_cur_max_time = bic->wr_time_left; -+ bfqq->last_wr_start_finish = jiffies; -+ bfqq->entity.ioprio_changed = 1; -+ } -+ /* -+ * Clear wr_time_left to prevent bfq_bfqq_save_state() from -+ * getting confused about the queue's need of a weight-raising -+ * period. -+ */ -+ bic->wr_time_left = 0; -+} -+ -+/* Must be called with the queue_lock held. 
*/ -+static int bfqq_process_refs(struct bfq_queue *bfqq) -+{ -+ int process_refs, io_refs; -+ -+ io_refs = bfqq->allocated[READ] + bfqq->allocated[WRITE]; -+ process_refs = atomic_read(&bfqq->ref) - io_refs - bfqq->entity.on_st; -+ BUG_ON(process_refs < 0); -+ return process_refs; -+} -+ -+/* Empty burst list and add just bfqq (see comments to bfq_handle_burst) */ -+static inline void bfq_reset_burst_list(struct bfq_data *bfqd, -+ struct bfq_queue *bfqq) -+{ -+ struct bfq_queue *item; -+ struct hlist_node *n; -+ -+ hlist_for_each_entry_safe(item, n, &bfqd->burst_list, burst_list_node) -+ hlist_del_init(&item->burst_list_node); -+ hlist_add_head(&bfqq->burst_list_node, &bfqd->burst_list); -+ bfqd->burst_size = 1; -+} -+ -+/* Add bfqq to the list of queues in current burst (see bfq_handle_burst) */ -+static void bfq_add_to_burst(struct bfq_data *bfqd, struct bfq_queue *bfqq) -+{ -+ /* Increment burst size to take into account also bfqq */ -+ bfqd->burst_size++; -+ -+ if (bfqd->burst_size == bfqd->bfq_large_burst_thresh) { -+ struct bfq_queue *pos, *bfqq_item; -+ struct hlist_node *n; -+ -+ /* -+ * Enough queues have been activated shortly after each -+ * other to consider this burst as large. -+ */ -+ bfqd->large_burst = true; -+ -+ /* -+ * We can now mark all queues in the burst list as -+ * belonging to a large burst. -+ */ -+ hlist_for_each_entry(bfqq_item, &bfqd->burst_list, -+ burst_list_node) -+ bfq_mark_bfqq_in_large_burst(bfqq_item); -+ bfq_mark_bfqq_in_large_burst(bfqq); -+ -+ /* -+ * From now on, and until the current burst finishes, any -+ * new queue being activated shortly after the last queue -+ * was inserted in the burst can be immediately marked as -+ * belonging to a large burst. So the burst list is not -+ * needed any more. Remove it. -+ */ -+ hlist_for_each_entry_safe(pos, n, &bfqd->burst_list, -+ burst_list_node) -+ hlist_del_init(&pos->burst_list_node); -+ } else /* burst not yet large: add bfqq to the burst list */ -+ hlist_add_head(&bfqq->burst_list_node, &bfqd->burst_list); -+} -+ -+/* -+ * If many queues happen to become active shortly after each other, then, -+ * to help the processes associated to these queues get their job done as -+ * soon as possible, it is usually better to not grant either weight-raising -+ * or device idling to these queues. In this comment we describe, firstly, -+ * the reasons why this fact holds, and, secondly, the next function, which -+ * implements the main steps needed to properly mark these queues so that -+ * they can then be treated in a different way. -+ * -+ * As for the terminology, we say that a queue becomes active, i.e., -+ * switches from idle to backlogged, either when it is created (as a -+ * consequence of the arrival of an I/O request), or, if already existing, -+ * when a new request for the queue arrives while the queue is idle. -+ * Bursts of activations, i.e., activations of different queues occurring -+ * shortly after each other, are typically caused by services or applications -+ * that spawn or reactivate many parallel threads/processes. Examples are -+ * systemd during boot or git grep. -+ * -+ * These services or applications benefit mostly from a high throughput: -+ * the quicker the requests of the activated queues are cumulatively served, -+ * the sooner the target job of these queues gets completed. As a consequence, -+ * weight-raising any of these queues, which also implies idling the device -+ * for it, is almost always counterproductive: in most cases it just lowers -+ * throughput. 
-+ * -+ * On the other hand, a burst of activations may be also caused by the start -+ * of an application that does not consist in a lot of parallel I/O-bound -+ * threads. In fact, with a complex application, the burst may be just a -+ * consequence of the fact that several processes need to be executed to -+ * start-up the application. To start an application as quickly as possible, -+ * the best thing to do is to privilege the I/O related to the application -+ * with respect to all other I/O. Therefore, the best strategy to start as -+ * quickly as possible an application that causes a burst of activations is -+ * to weight-raise all the queues activated during the burst. This is the -+ * exact opposite of the best strategy for the other type of bursts. -+ * -+ * In the end, to take the best action for each of the two cases, the two -+ * types of bursts need to be distinguished. Fortunately, this seems -+ * relatively easy to do, by looking at the sizes of the bursts. In -+ * particular, we found a threshold such that bursts with a larger size -+ * than that threshold are apparently caused only by services or commands -+ * such as systemd or git grep. For brevity, hereafter we call just 'large' -+ * these bursts. BFQ *does not* weight-raise queues whose activations occur -+ * in a large burst. In addition, for each of these queues BFQ performs or -+ * does not perform idling depending on which choice boosts the throughput -+ * most. The exact choice depends on the device and request pattern at -+ * hand. -+ * -+ * Turning back to the next function, it implements all the steps needed -+ * to detect the occurrence of a large burst and to properly mark all the -+ * queues belonging to it (so that they can then be treated in a different -+ * way). This goal is achieved by maintaining a special "burst list" that -+ * holds, temporarily, the queues that belong to the burst in progress. The -+ * list is then used to mark these queues as belonging to a large burst if -+ * the burst does become large. The main steps are the following. -+ * -+ * . when the very first queue is activated, the queue is inserted into the -+ * list (as it could be the first queue in a possible burst) -+ * -+ * . if the current burst has not yet become large, and a queue Q that does -+ * not yet belong to the burst is activated shortly after the last time -+ * at which a new queue entered the burst list, then the function appends -+ * Q to the burst list -+ * -+ * . if, as a consequence of the previous step, the burst size reaches -+ * the large-burst threshold, then -+ * -+ * . all the queues in the burst list are marked as belonging to a -+ * large burst -+ * -+ * . the burst list is deleted; in fact, the burst list already served -+ * its purpose (keeping temporarily track of the queues in a burst, -+ * so as to be able to mark them as belonging to a large burst in the -+ * previous sub-step), and now is not needed any more -+ * -+ * . the device enters a large-burst mode -+ * -+ * . if a queue Q that does not belong to the burst is activated while -+ * the device is in large-burst mode and shortly after the last time -+ * at which a queue either entered the burst list or was marked as -+ * belonging to the current large burst, then Q is immediately marked -+ * as belonging to a large burst. -+ * -+ * . 
if a queue Q that does not belong to the burst is activated a while -+ * later, i.e., not shortly after, than the last time at which a queue -+ * either entered the burst list or was marked as belonging to the -+ * current large burst, then the current burst is deemed as finished and: -+ * -+ * . the large-burst mode is reset if set -+ * -+ * . the burst list is emptied -+ * -+ * . Q is inserted in the burst list, as Q may be the first queue -+ * in a possible new burst (then the burst list contains just Q -+ * after this step). -+ */ -+static void bfq_handle_burst(struct bfq_data *bfqd, struct bfq_queue *bfqq, -+ bool idle_for_long_time) -+{ -+ /* -+ * If bfqq happened to be activated in a burst, but has been idle -+ * for at least as long as an interactive queue, then we assume -+ * that, in the overall I/O initiated in the burst, the I/O -+ * associated to bfqq is finished. So bfqq does not need to be -+ * treated as a queue belonging to a burst anymore. Accordingly, -+ * we reset bfqq's in_large_burst flag if set, and remove bfqq -+ * from the burst list if it's there. We do not decrement instead -+ * burst_size, because the fact that bfqq does not need to belong -+ * to the burst list any more does not invalidate the fact that -+ * bfqq may have been activated during the current burst. -+ */ -+ if (idle_for_long_time) { -+ hlist_del_init(&bfqq->burst_list_node); -+ bfq_clear_bfqq_in_large_burst(bfqq); -+ } -+ -+ /* -+ * If bfqq is already in the burst list or is part of a large -+ * burst, then there is nothing else to do. -+ */ -+ if (!hlist_unhashed(&bfqq->burst_list_node) || -+ bfq_bfqq_in_large_burst(bfqq)) -+ return; -+ -+ /* -+ * If bfqq's activation happens late enough, then the current -+ * burst is finished, and related data structures must be reset. -+ * -+ * In this respect, consider the special case where bfqq is the very -+ * first queue being activated. In this case, last_ins_in_burst is -+ * not yet significant when we get here. But it is easy to verify -+ * that, whether or not the following condition is true, bfqq will -+ * end up being inserted into the burst list. In particular the -+ * list will happen to contain only bfqq. And this is exactly what -+ * has to happen, as bfqq may be the first queue in a possible -+ * burst. -+ */ -+ if (time_is_before_jiffies(bfqd->last_ins_in_burst + -+ bfqd->bfq_burst_interval)) { -+ bfqd->large_burst = false; -+ bfq_reset_burst_list(bfqd, bfqq); -+ return; -+ } -+ -+ /* -+ * If we get here, then bfqq is being activated shortly after the -+ * last queue. So, if the current burst is also large, we can mark -+ * bfqq as belonging to this large burst immediately. -+ */ -+ if (bfqd->large_burst) { -+ bfq_mark_bfqq_in_large_burst(bfqq); -+ return; -+ } -+ -+ /* -+ * If we get here, then a large-burst state has not yet been -+ * reached, but bfqq is being activated shortly after the last -+ * queue. Then we add bfqq to the burst. -+ */ -+ bfq_add_to_burst(bfqd, bfqq); -+} -+ -+static void bfq_add_request(struct request *rq) -+{ -+ struct bfq_queue *bfqq = RQ_BFQQ(rq); -+ struct bfq_entity *entity = &bfqq->entity; -+ struct bfq_data *bfqd = bfqq->bfqd; -+ struct request *next_rq, *prev; -+ unsigned long old_wr_coeff = bfqq->wr_coeff; -+ bool interactive = false; -+ -+ bfq_log_bfqq(bfqd, bfqq, "add_request %d", rq_is_sync(rq)); -+ bfqq->queued[rq_is_sync(rq)]++; -+ bfqd->queued++; -+ -+ elv_rb_add(&bfqq->sort_list, rq); -+ -+ /* -+ * Check if this request is a better next-serve candidate. 
-+ */ -+ prev = bfqq->next_rq; -+ next_rq = bfq_choose_req(bfqd, bfqq->next_rq, rq, bfqd->last_position); -+ BUG_ON(next_rq == NULL); -+ bfqq->next_rq = next_rq; -+ -+ /* -+ * Adjust priority tree position, if next_rq changes. -+ */ -+ if (prev != bfqq->next_rq) -+ bfq_rq_pos_tree_add(bfqd, bfqq); -+ -+ if (!bfq_bfqq_busy(bfqq)) { -+ bool soft_rt, coop_or_in_burst, -+ idle_for_long_time = time_is_before_jiffies( -+ bfqq->budget_timeout + -+ bfqd->bfq_wr_min_idle_time); -+ -+ if (bfq_bfqq_sync(bfqq)) { -+ bool already_in_burst = -+ !hlist_unhashed(&bfqq->burst_list_node) || -+ bfq_bfqq_in_large_burst(bfqq); -+ bfq_handle_burst(bfqd, bfqq, idle_for_long_time); -+ /* -+ * If bfqq was not already in the current burst, -+ * then, at this point, bfqq either has been -+ * added to the current burst or has caused the -+ * current burst to terminate. In particular, in -+ * the second case, bfqq has become the first -+ * queue in a possible new burst. -+ * In both cases last_ins_in_burst needs to be -+ * moved forward. -+ */ -+ if (!already_in_burst) -+ bfqd->last_ins_in_burst = jiffies; -+ } -+ -+ coop_or_in_burst = bfq_bfqq_in_large_burst(bfqq) || -+ bfq_bfqq_cooperations(bfqq) >= bfqd->bfq_coop_thresh; -+ soft_rt = bfqd->bfq_wr_max_softrt_rate > 0 && -+ !coop_or_in_burst && -+ time_is_before_jiffies(bfqq->soft_rt_next_start); -+ interactive = !coop_or_in_burst && idle_for_long_time; -+ entity->budget = max_t(unsigned long, bfqq->max_budget, -+ bfq_serv_to_charge(next_rq, bfqq)); -+ -+ if (!bfq_bfqq_IO_bound(bfqq)) { -+ if (time_before(jiffies, -+ RQ_BIC(rq)->ttime.last_end_request + -+ bfqd->bfq_slice_idle)) { -+ bfqq->requests_within_timer++; -+ if (bfqq->requests_within_timer >= -+ bfqd->bfq_requests_within_timer) -+ bfq_mark_bfqq_IO_bound(bfqq); -+ } else -+ bfqq->requests_within_timer = 0; -+ } -+ -+ if (!bfqd->low_latency) -+ goto add_bfqq_busy; -+ -+ if (bfq_bfqq_just_split(bfqq)) -+ goto set_ioprio_changed; -+ -+ /* -+ * If the queue: -+ * - is not being boosted, -+ * - has been idle for enough time, -+ * - is not a sync queue or is linked to a bfq_io_cq (it is -+ * shared "for its nature" or it is not shared and its -+ * requests have not been redirected to a shared queue) -+ * start a weight-raising period. -+ */ -+ if (old_wr_coeff == 1 && (interactive || soft_rt) && -+ (!bfq_bfqq_sync(bfqq) || bfqq->bic != NULL)) { -+ bfqq->wr_coeff = bfqd->bfq_wr_coeff; -+ if (interactive) -+ bfqq->wr_cur_max_time = bfq_wr_duration(bfqd); -+ else -+ bfqq->wr_cur_max_time = -+ bfqd->bfq_wr_rt_max_time; -+ bfq_log_bfqq(bfqd, bfqq, -+ "wrais starting at %lu, rais_max_time %u", -+ jiffies, -+ jiffies_to_msecs(bfqq->wr_cur_max_time)); -+ } else if (old_wr_coeff > 1) { -+ if (interactive) -+ bfqq->wr_cur_max_time = bfq_wr_duration(bfqd); -+ else if (coop_or_in_burst || -+ (bfqq->wr_cur_max_time == -+ bfqd->bfq_wr_rt_max_time && -+ !soft_rt)) { -+ bfqq->wr_coeff = 1; -+ bfq_log_bfqq(bfqd, bfqq, -+ "wrais ending at %lu, rais_max_time %u", -+ jiffies, -+ jiffies_to_msecs(bfqq-> -+ wr_cur_max_time)); -+ } else if (time_before( -+ bfqq->last_wr_start_finish + -+ bfqq->wr_cur_max_time, -+ jiffies + -+ bfqd->bfq_wr_rt_max_time) && -+ soft_rt) { -+ /* -+ * -+ * The remaining weight-raising time is lower -+ * than bfqd->bfq_wr_rt_max_time, which means -+ * that the application is enjoying weight -+ * raising either because deemed soft-rt in -+ * the near past, or because deemed interactive -+ * a long ago. 
-+ * In both cases, resetting now the current -+ * remaining weight-raising time for the -+ * application to the weight-raising duration -+ * for soft rt applications would not cause any -+ * latency increase for the application (as the -+ * new duration would be higher than the -+ * remaining time). -+ * -+ * In addition, the application is now meeting -+ * the requirements for being deemed soft rt. -+ * In the end we can correctly and safely -+ * (re)charge the weight-raising duration for -+ * the application with the weight-raising -+ * duration for soft rt applications. -+ * -+ * In particular, doing this recharge now, i.e., -+ * before the weight-raising period for the -+ * application finishes, reduces the probability -+ * of the following negative scenario: -+ * 1) the weight of a soft rt application is -+ * raised at startup (as for any newly -+ * created application), -+ * 2) since the application is not interactive, -+ * at a certain time weight-raising is -+ * stopped for the application, -+ * 3) at that time the application happens to -+ * still have pending requests, and hence -+ * is destined to not have a chance to be -+ * deemed soft rt before these requests are -+ * completed (see the comments to the -+ * function bfq_bfqq_softrt_next_start() -+ * for details on soft rt detection), -+ * 4) these pending requests experience a high -+ * latency because the application is not -+ * weight-raised while they are pending. -+ */ -+ bfqq->last_wr_start_finish = jiffies; -+ bfqq->wr_cur_max_time = -+ bfqd->bfq_wr_rt_max_time; -+ } -+ } -+set_ioprio_changed: -+ if (old_wr_coeff != bfqq->wr_coeff) -+ entity->ioprio_changed = 1; -+add_bfqq_busy: -+ bfqq->last_idle_bklogged = jiffies; -+ bfqq->service_from_backlogged = 0; -+ bfq_clear_bfqq_softrt_update(bfqq); -+ bfq_add_bfqq_busy(bfqd, bfqq); -+ } else { -+ if (bfqd->low_latency && old_wr_coeff == 1 && !rq_is_sync(rq) && -+ time_is_before_jiffies( -+ bfqq->last_wr_start_finish + -+ bfqd->bfq_wr_min_inter_arr_async)) { -+ bfqq->wr_coeff = bfqd->bfq_wr_coeff; -+ bfqq->wr_cur_max_time = bfq_wr_duration(bfqd); -+ -+ bfqd->wr_busy_queues++; -+ entity->ioprio_changed = 1; -+ bfq_log_bfqq(bfqd, bfqq, -+ "non-idle wrais starting at %lu, rais_max_time %u", -+ jiffies, -+ jiffies_to_msecs(bfqq->wr_cur_max_time)); -+ } -+ if (prev != bfqq->next_rq) -+ bfq_updated_next_req(bfqd, bfqq); -+ } -+ -+ if (bfqd->low_latency && -+ (old_wr_coeff == 1 || bfqq->wr_coeff == 1 || interactive)) -+ bfqq->last_wr_start_finish = jiffies; -+} -+ -+static struct request *bfq_find_rq_fmerge(struct bfq_data *bfqd, -+ struct bio *bio) -+{ -+ struct task_struct *tsk = current; -+ struct bfq_io_cq *bic; -+ struct bfq_queue *bfqq; -+ -+ bic = bfq_bic_lookup(bfqd, tsk->io_context); -+ if (bic == NULL) -+ return NULL; -+ -+ bfqq = bic_to_bfqq(bic, bfq_bio_sync(bio)); -+ if (bfqq != NULL) -+ return elv_rb_find(&bfqq->sort_list, bio_end_sector(bio)); -+ -+ return NULL; -+} -+ -+static void bfq_activate_request(struct request_queue *q, struct request *rq) -+{ -+ struct bfq_data *bfqd = q->elevator->elevator_data; -+ -+ bfqd->rq_in_driver++; -+ bfqd->last_position = blk_rq_pos(rq) + blk_rq_sectors(rq); -+ bfq_log(bfqd, "activate_request: new bfqd->last_position %llu", -+ (long long unsigned)bfqd->last_position); -+} -+ -+static inline void bfq_deactivate_request(struct request_queue *q, -+ struct request *rq) -+{ -+ struct bfq_data *bfqd = q->elevator->elevator_data; -+ -+ BUG_ON(bfqd->rq_in_driver == 0); -+ bfqd->rq_in_driver--; -+} -+ -+static void bfq_remove_request(struct 
request *rq) -+{ -+ struct bfq_queue *bfqq = RQ_BFQQ(rq); -+ struct bfq_data *bfqd = bfqq->bfqd; -+ const int sync = rq_is_sync(rq); -+ -+ if (bfqq->next_rq == rq) { -+ bfqq->next_rq = bfq_find_next_rq(bfqd, bfqq, rq); -+ bfq_updated_next_req(bfqd, bfqq); -+ } -+ -+ list_del_init(&rq->queuelist); -+ BUG_ON(bfqq->queued[sync] == 0); -+ bfqq->queued[sync]--; -+ bfqd->queued--; -+ elv_rb_del(&bfqq->sort_list, rq); -+ -+ if (RB_EMPTY_ROOT(&bfqq->sort_list)) { -+ if (bfq_bfqq_busy(bfqq) && bfqq != bfqd->in_service_queue) -+ bfq_del_bfqq_busy(bfqd, bfqq, 1); -+ /* -+ * Remove queue from request-position tree as it is empty. -+ */ -+ if (bfqq->pos_root != NULL) { -+ rb_erase(&bfqq->pos_node, bfqq->pos_root); -+ bfqq->pos_root = NULL; -+ } -+ } -+ -+ if (rq->cmd_flags & REQ_META) { -+ BUG_ON(bfqq->meta_pending == 0); -+ bfqq->meta_pending--; -+ } -+} -+ -+static int bfq_merge(struct request_queue *q, struct request **req, -+ struct bio *bio) -+{ -+ struct bfq_data *bfqd = q->elevator->elevator_data; -+ struct request *__rq; -+ -+ __rq = bfq_find_rq_fmerge(bfqd, bio); -+ if (__rq != NULL && elv_rq_merge_ok(__rq, bio)) { -+ *req = __rq; -+ return ELEVATOR_FRONT_MERGE; -+ } -+ -+ return ELEVATOR_NO_MERGE; -+} -+ -+static void bfq_merged_request(struct request_queue *q, struct request *req, -+ int type) -+{ -+ if (type == ELEVATOR_FRONT_MERGE && -+ rb_prev(&req->rb_node) && -+ blk_rq_pos(req) < -+ blk_rq_pos(container_of(rb_prev(&req->rb_node), -+ struct request, rb_node))) { -+ struct bfq_queue *bfqq = RQ_BFQQ(req); -+ struct bfq_data *bfqd = bfqq->bfqd; -+ struct request *prev, *next_rq; -+ -+ /* Reposition request in its sort_list */ -+ elv_rb_del(&bfqq->sort_list, req); -+ elv_rb_add(&bfqq->sort_list, req); -+ /* Choose next request to be served for bfqq */ -+ prev = bfqq->next_rq; -+ next_rq = bfq_choose_req(bfqd, bfqq->next_rq, req, -+ bfqd->last_position); -+ BUG_ON(next_rq == NULL); -+ bfqq->next_rq = next_rq; -+ /* -+ * If next_rq changes, update both the queue's budget to -+ * fit the new request and the queue's position in its -+ * rq_pos_tree. -+ */ -+ if (prev != bfqq->next_rq) { -+ bfq_updated_next_req(bfqd, bfqq); -+ bfq_rq_pos_tree_add(bfqd, bfqq); -+ } -+ } -+} -+ -+static void bfq_merged_requests(struct request_queue *q, struct request *rq, -+ struct request *next) -+{ -+ struct bfq_queue *bfqq = RQ_BFQQ(rq); -+ -+ /* -+ * Reposition in fifo if next is older than rq. 
-+ */ -+ if (!list_empty(&rq->queuelist) && !list_empty(&next->queuelist) && -+ time_before(next->fifo_time, rq->fifo_time)) { -+ list_move(&rq->queuelist, &next->queuelist); -+ rq->fifo_time = next->fifo_time; -+ } -+ -+ if (bfqq->next_rq == next) -+ bfqq->next_rq = rq; -+ -+ bfq_remove_request(next); -+} -+ -+/* Must be called with bfqq != NULL */ -+static inline void bfq_bfqq_end_wr(struct bfq_queue *bfqq) -+{ -+ BUG_ON(bfqq == NULL); -+ if (bfq_bfqq_busy(bfqq)) -+ bfqq->bfqd->wr_busy_queues--; -+ bfqq->wr_coeff = 1; -+ bfqq->wr_cur_max_time = 0; -+ /* Trigger a weight change on the next activation of the queue */ -+ bfqq->entity.ioprio_changed = 1; -+} -+ -+static void bfq_end_wr_async_queues(struct bfq_data *bfqd, -+ struct bfq_group *bfqg) -+{ -+ int i, j; -+ -+ for (i = 0; i < 2; i++) -+ for (j = 0; j < IOPRIO_BE_NR; j++) -+ if (bfqg->async_bfqq[i][j] != NULL) -+ bfq_bfqq_end_wr(bfqg->async_bfqq[i][j]); -+ if (bfqg->async_idle_bfqq != NULL) -+ bfq_bfqq_end_wr(bfqg->async_idle_bfqq); -+} -+ -+static void bfq_end_wr(struct bfq_data *bfqd) -+{ -+ struct bfq_queue *bfqq; -+ -+ spin_lock_irq(bfqd->queue->queue_lock); -+ -+ list_for_each_entry(bfqq, &bfqd->active_list, bfqq_list) -+ bfq_bfqq_end_wr(bfqq); -+ list_for_each_entry(bfqq, &bfqd->idle_list, bfqq_list) -+ bfq_bfqq_end_wr(bfqq); -+ bfq_end_wr_async(bfqd); -+ -+ spin_unlock_irq(bfqd->queue->queue_lock); -+} -+ -+static inline sector_t bfq_io_struct_pos(void *io_struct, bool request) -+{ -+ if (request) -+ return blk_rq_pos(io_struct); -+ else -+ return ((struct bio *)io_struct)->bi_iter.bi_sector; -+} -+ -+static inline sector_t bfq_dist_from(sector_t pos1, -+ sector_t pos2) -+{ -+ if (pos1 >= pos2) -+ return pos1 - pos2; -+ else -+ return pos2 - pos1; -+} -+ -+static inline int bfq_rq_close_to_sector(void *io_struct, bool request, -+ sector_t sector) -+{ -+ return bfq_dist_from(bfq_io_struct_pos(io_struct, request), sector) <= -+ BFQQ_SEEK_THR; -+} -+ -+static struct bfq_queue *bfqq_close(struct bfq_data *bfqd, sector_t sector) -+{ -+ struct rb_root *root = &bfqd->rq_pos_tree; -+ struct rb_node *parent, *node; -+ struct bfq_queue *__bfqq; -+ -+ if (RB_EMPTY_ROOT(root)) -+ return NULL; -+ -+ /* -+ * First, if we find a request starting at the end of the last -+ * request, choose it. -+ */ -+ __bfqq = bfq_rq_pos_tree_lookup(bfqd, root, sector, &parent, NULL); -+ if (__bfqq != NULL) -+ return __bfqq; -+ -+ /* -+ * If the exact sector wasn't found, the parent of the NULL leaf -+ * will contain the closest sector (rq_pos_tree sorted by -+ * next_request position). 
-+ */ -+ __bfqq = rb_entry(parent, struct bfq_queue, pos_node); -+ if (bfq_rq_close_to_sector(__bfqq->next_rq, true, sector)) -+ return __bfqq; -+ -+ if (blk_rq_pos(__bfqq->next_rq) < sector) -+ node = rb_next(&__bfqq->pos_node); -+ else -+ node = rb_prev(&__bfqq->pos_node); -+ if (node == NULL) -+ return NULL; -+ -+ __bfqq = rb_entry(node, struct bfq_queue, pos_node); -+ if (bfq_rq_close_to_sector(__bfqq->next_rq, true, sector)) -+ return __bfqq; -+ -+ return NULL; -+} -+ -+/* -+ * bfqd - obvious -+ * cur_bfqq - passed in so that we don't decide that the current queue -+ * is closely cooperating with itself -+ * sector - used as a reference point to search for a close queue -+ */ -+static struct bfq_queue *bfq_close_cooperator(struct bfq_data *bfqd, -+ struct bfq_queue *cur_bfqq, -+ sector_t sector) -+{ -+ struct bfq_queue *bfqq; -+ -+ if (bfq_class_idle(cur_bfqq)) -+ return NULL; -+ if (!bfq_bfqq_sync(cur_bfqq)) -+ return NULL; -+ if (BFQQ_SEEKY(cur_bfqq)) -+ return NULL; -+ -+ /* If device has only one backlogged bfq_queue, don't search. */ -+ if (bfqd->busy_queues == 1) -+ return NULL; -+ -+ /* -+ * We should notice if some of the queues are cooperating, e.g. -+ * working closely on the same area of the disk. In that case, -+ * we can group them together and don't waste time idling. -+ */ -+ bfqq = bfqq_close(bfqd, sector); -+ if (bfqq == NULL || bfqq == cur_bfqq) -+ return NULL; -+ -+ /* -+ * Do not merge queues from different bfq_groups. -+ */ -+ if (bfqq->entity.parent != cur_bfqq->entity.parent) -+ return NULL; -+ -+ /* -+ * It only makes sense to merge sync queues. -+ */ -+ if (!bfq_bfqq_sync(bfqq)) -+ return NULL; -+ if (BFQQ_SEEKY(bfqq)) -+ return NULL; -+ -+ /* -+ * Do not merge queues of different priority classes. -+ */ -+ if (bfq_class_rt(bfqq) != bfq_class_rt(cur_bfqq)) -+ return NULL; -+ -+ return bfqq; -+} -+ -+static struct bfq_queue * -+bfq_setup_merge(struct bfq_queue *bfqq, struct bfq_queue *new_bfqq) -+{ -+ int process_refs, new_process_refs; -+ struct bfq_queue *__bfqq; -+ -+ /* -+ * If there are no process references on the new_bfqq, then it is -+ * unsafe to follow the ->new_bfqq chain as other bfqq's in the chain -+ * may have dropped their last reference (not just their last process -+ * reference). -+ */ -+ if (!bfqq_process_refs(new_bfqq)) -+ return NULL; -+ -+ /* Avoid a circular list and skip interim queue merges. */ -+ while ((__bfqq = new_bfqq->new_bfqq)) { -+ if (__bfqq == bfqq) -+ return NULL; -+ new_bfqq = __bfqq; -+ } -+ -+ process_refs = bfqq_process_refs(bfqq); -+ new_process_refs = bfqq_process_refs(new_bfqq); -+ /* -+ * If the process for the bfqq has gone away, there is no -+ * sense in merging the queues. -+ */ -+ if (process_refs == 0 || new_process_refs == 0) -+ return NULL; -+ -+ bfq_log_bfqq(bfqq->bfqd, bfqq, "scheduling merge with queue %d", -+ new_bfqq->pid); -+ -+ /* -+ * Merging is just a redirection: the requests of the process -+ * owning one of the two queues are redirected to the other queue. -+ * The latter queue, in its turn, is set as shared if this is the -+ * first time that the requests of some process are redirected to -+ * it. -+ * -+ * We redirect bfqq to new_bfqq and not the opposite, because we -+ * are in the context of the process owning bfqq, hence we have -+ * the io_cq of this process. So we can immediately configure this -+ * io_cq to redirect the requests of the process to new_bfqq. 
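The "avoid a circular list" step in bfq_setup_merge above is worth a concrete illustration. The sketch below is a plain userspace restatement with invented names (resolve_merge_target, struct queue with a new_queue pointer): follow the redirection chain to its final target, and give up if the chain ever loops back to the queue being merged.

/* Userspace sketch of the ->new_bfqq chain walk in bfq_setup_merge:
 * follow redirections to the final target, bail out on a cycle. */
#include <stdio.h>
#include <stddef.h>

struct queue {
	int id;
	struct queue *new_queue;	/* stand-in for bfqq->new_bfqq */
};

/* Return the final merge target for @start, or NULL if the chain
 * loops back to @start (cf. the while loop in bfq_setup_merge). */
static struct queue *resolve_merge_target(struct queue *start,
					  struct queue *candidate)
{
	struct queue *next;

	while ((next = candidate->new_queue)) {
		if (next == start)
			return NULL;		/* circular chain */
		candidate = next;
	}
	return candidate;
}

int main(void)
{
	struct queue a = { .id = 1 }, b = { .id = 2 }, c = { .id = 3 };

	b.new_queue = &c;			/* b was already merged into c */
	printf("target: %d\n", resolve_merge_target(&a, &b)->id);	/* 3 */

	c.new_queue = &a;			/* now the chain loops back to a */
	printf("target: %p\n", (void *)resolve_merge_target(&a, &b));	/* (nil) */
	return 0;
}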
-+ * -+ * NOTE, even if new_bfqq coincides with the in-service queue, the -+ * io_cq of new_bfqq is not available, because, if the in-service -+ * queue is shared, bfqd->in_service_bic may not point to the -+ * io_cq of the in-service queue. -+ * Redirecting the requests of the process owning bfqq to the -+ * currently in-service queue is in any case the best option, as -+ * we feed the in-service queue with new requests close to the -+ * last request served and, by doing so, hopefully increase the -+ * throughput. -+ */ -+ bfqq->new_bfqq = new_bfqq; -+ atomic_add(process_refs, &new_bfqq->ref); -+ return new_bfqq; -+} -+ -+/* -+ * Attempt to schedule a merge of bfqq with the currently in-service queue -+ * or with a close queue among the scheduled queues. -+ * Return NULL if no merge was scheduled, a pointer to the shared bfq_queue -+ * structure otherwise. -+ * -+ * The OOM queue is not allowed to participate to cooperation: in fact, since -+ * the requests temporarily redirected to the OOM queue could be redirected -+ * again to dedicated queues at any time, the state needed to correctly -+ * handle merging with the OOM queue would be quite complex and expensive -+ * to maintain. Besides, in such a critical condition as an out of memory, -+ * the benefits of queue merging may be little relevant, or even negligible. -+ */ -+static struct bfq_queue * -+bfq_setup_cooperator(struct bfq_data *bfqd, struct bfq_queue *bfqq, -+ void *io_struct, bool request) -+{ -+ struct bfq_queue *in_service_bfqq, *new_bfqq; -+ -+ if (bfqq->new_bfqq) -+ return bfqq->new_bfqq; -+ -+ if (!io_struct || unlikely(bfqq == &bfqd->oom_bfqq)) -+ return NULL; -+ -+ in_service_bfqq = bfqd->in_service_queue; -+ -+ if (in_service_bfqq == NULL || in_service_bfqq == bfqq || -+ !bfqd->in_service_bic || -+ unlikely(in_service_bfqq == &bfqd->oom_bfqq)) -+ goto check_scheduled; -+ -+ if (bfq_class_idle(in_service_bfqq) || bfq_class_idle(bfqq)) -+ goto check_scheduled; -+ -+ if (bfq_class_rt(in_service_bfqq) != bfq_class_rt(bfqq)) -+ goto check_scheduled; -+ -+ if (in_service_bfqq->entity.parent != bfqq->entity.parent) -+ goto check_scheduled; -+ -+ if (bfq_rq_close_to_sector(io_struct, request, bfqd->last_position) && -+ bfq_bfqq_sync(in_service_bfqq) && bfq_bfqq_sync(bfqq)) { -+ new_bfqq = bfq_setup_merge(bfqq, in_service_bfqq); -+ if (new_bfqq != NULL) -+ return new_bfqq; /* Merge with in-service queue */ -+ } -+ -+ /* -+ * Check whether there is a cooperator among currently scheduled -+ * queues. The only thing we need is that the bio/request is not -+ * NULL, as we need it to establish whether a cooperator exists. -+ */ -+check_scheduled: -+ new_bfqq = bfq_close_cooperator(bfqd, bfqq, -+ bfq_io_struct_pos(io_struct, request)); -+ if (new_bfqq && likely(new_bfqq != &bfqd->oom_bfqq)) -+ return bfq_setup_merge(bfqq, new_bfqq); -+ -+ return NULL; -+} -+ -+static inline void -+bfq_bfqq_save_state(struct bfq_queue *bfqq) -+{ -+ /* -+ * If bfqq->bic == NULL, the queue is already shared or its requests -+ * have already been redirected to a shared queue; both idle window -+ * and weight raising state have already been saved. Do nothing. -+ */ -+ if (bfqq->bic == NULL) -+ return; -+ if (bfqq->bic->wr_time_left) -+ /* -+ * This is the queue of a just-started process, and would -+ * deserve weight raising: we set wr_time_left to the full -+ * weight-raising duration to trigger weight-raising when -+ * and if the queue is split and the first request of the -+ * queue is enqueued. 
-+ */ -+ bfqq->bic->wr_time_left = bfq_wr_duration(bfqq->bfqd); -+ else if (bfqq->wr_coeff > 1) { -+ unsigned long wr_duration = -+ jiffies - bfqq->last_wr_start_finish; -+ /* -+ * It may happen that a queue's weight raising period lasts -+ * longer than its wr_cur_max_time, as weight raising is -+ * handled only when a request is enqueued or dispatched (it -+ * does not use any timer). If the weight raising period is -+ * about to end, don't save it. -+ */ -+ if (bfqq->wr_cur_max_time <= wr_duration) -+ bfqq->bic->wr_time_left = 0; -+ else -+ bfqq->bic->wr_time_left = -+ bfqq->wr_cur_max_time - wr_duration; -+ /* -+ * The bfq_queue is becoming shared or the requests of the -+ * process owning the queue are being redirected to a shared -+ * queue. Stop the weight raising period of the queue, as in -+ * both cases it should not be owned by an interactive or -+ * soft real-time application. -+ */ -+ bfq_bfqq_end_wr(bfqq); -+ } else -+ bfqq->bic->wr_time_left = 0; -+ bfqq->bic->saved_idle_window = bfq_bfqq_idle_window(bfqq); -+ bfqq->bic->saved_IO_bound = bfq_bfqq_IO_bound(bfqq); -+ bfqq->bic->saved_in_large_burst = bfq_bfqq_in_large_burst(bfqq); -+ bfqq->bic->was_in_burst_list = !hlist_unhashed(&bfqq->burst_list_node); -+ bfqq->bic->cooperations++; -+ bfqq->bic->failed_cooperations = 0; -+} -+ -+static inline void -+bfq_get_bic_reference(struct bfq_queue *bfqq) -+{ -+ /* -+ * If bfqq->bic has a non-NULL value, the bic to which it belongs -+ * is about to begin using a shared bfq_queue. -+ */ -+ if (bfqq->bic) -+ atomic_long_inc(&bfqq->bic->icq.ioc->refcount); -+} -+ -+static void -+bfq_merge_bfqqs(struct bfq_data *bfqd, struct bfq_io_cq *bic, -+ struct bfq_queue *bfqq, struct bfq_queue *new_bfqq) -+{ -+ bfq_log_bfqq(bfqd, bfqq, "merging with queue %lu", -+ (long unsigned)new_bfqq->pid); -+ /* Save weight raising and idle window of the merged queues */ -+ bfq_bfqq_save_state(bfqq); -+ bfq_bfqq_save_state(new_bfqq); -+ if (bfq_bfqq_IO_bound(bfqq)) -+ bfq_mark_bfqq_IO_bound(new_bfqq); -+ bfq_clear_bfqq_IO_bound(bfqq); -+ /* -+ * Grab a reference to the bic, to prevent it from being destroyed -+ * before being possibly touched by a bfq_split_bfqq(). -+ */ -+ bfq_get_bic_reference(bfqq); -+ bfq_get_bic_reference(new_bfqq); -+ /* -+ * Merge queues (that is, let bic redirect its requests to new_bfqq) -+ */ -+ bic_set_bfqq(bic, new_bfqq, 1); -+ bfq_mark_bfqq_coop(new_bfqq); -+ /* -+ * new_bfqq now belongs to at least two bics (it is a shared queue): -+ * set new_bfqq->bic to NULL. bfqq either: -+ * - does not belong to any bic any more, and hence bfqq->bic must -+ * be set to NULL, or -+ * - is a queue whose owning bics have already been redirected to a -+ * different queue, hence the queue is destined to not belong to -+ * any bic soon and bfqq->bic is already NULL (therefore the next -+ * assignment causes no harm). 
-+ */ -+ new_bfqq->bic = NULL; -+ bfqq->bic = NULL; -+ bfq_put_queue(bfqq); -+} -+ -+static inline void bfq_bfqq_increase_failed_cooperations(struct bfq_queue *bfqq) -+{ -+ struct bfq_io_cq *bic = bfqq->bic; -+ struct bfq_data *bfqd = bfqq->bfqd; -+ -+ if (bic && bfq_bfqq_cooperations(bfqq) >= bfqd->bfq_coop_thresh) { -+ bic->failed_cooperations++; -+ if (bic->failed_cooperations >= bfqd->bfq_failed_cooperations) -+ bic->cooperations = 0; -+ } -+} -+ -+static int bfq_allow_merge(struct request_queue *q, struct request *rq, -+ struct bio *bio) -+{ -+ struct bfq_data *bfqd = q->elevator->elevator_data; -+ struct bfq_io_cq *bic; -+ struct bfq_queue *bfqq, *new_bfqq; -+ -+ /* -+ * Disallow merge of a sync bio into an async request. -+ */ -+ if (bfq_bio_sync(bio) && !rq_is_sync(rq)) -+ return 0; -+ -+ /* -+ * Lookup the bfqq that this bio will be queued with. Allow -+ * merge only if rq is queued there. -+ * Queue lock is held here. -+ */ -+ bic = bfq_bic_lookup(bfqd, current->io_context); -+ if (bic == NULL) -+ return 0; -+ -+ bfqq = bic_to_bfqq(bic, bfq_bio_sync(bio)); -+ /* -+ * We take advantage of this function to perform an early merge -+ * of the queues of possible cooperating processes. -+ */ -+ if (bfqq != NULL) { -+ new_bfqq = bfq_setup_cooperator(bfqd, bfqq, bio, false); -+ if (new_bfqq != NULL) { -+ bfq_merge_bfqqs(bfqd, bic, bfqq, new_bfqq); -+ /* -+ * If we get here, the bio will be queued in the -+ * shared queue, i.e., new_bfqq, so use new_bfqq -+ * to decide whether bio and rq can be merged. -+ */ -+ bfqq = new_bfqq; -+ } else -+ bfq_bfqq_increase_failed_cooperations(bfqq); -+ } -+ -+ return bfqq == RQ_BFQQ(rq); -+} -+ -+static void __bfq_set_in_service_queue(struct bfq_data *bfqd, -+ struct bfq_queue *bfqq) -+{ -+ if (bfqq != NULL) { -+ bfq_mark_bfqq_must_alloc(bfqq); -+ bfq_mark_bfqq_budget_new(bfqq); -+ bfq_clear_bfqq_fifo_expire(bfqq); -+ -+ bfqd->budgets_assigned = (bfqd->budgets_assigned*7 + 256) / 8; -+ -+ bfq_log_bfqq(bfqd, bfqq, -+ "set_in_service_queue, cur-budget = %lu", -+ bfqq->entity.budget); -+ } -+ -+ bfqd->in_service_queue = bfqq; -+} -+ -+/* -+ * Get and set a new queue for service. -+ */ -+static struct bfq_queue *bfq_set_in_service_queue(struct bfq_data *bfqd) -+{ -+ struct bfq_queue *bfqq = bfq_get_next_queue(bfqd); -+ -+ __bfq_set_in_service_queue(bfqd, bfqq); -+ return bfqq; -+} -+ -+/* -+ * If enough samples have been computed, return the current max budget -+ * stored in bfqd, which is dynamically updated according to the -+ * estimated disk peak rate; otherwise return the default max budget -+ */ -+static inline unsigned long bfq_max_budget(struct bfq_data *bfqd) -+{ -+ if (bfqd->budgets_assigned < 194) -+ return bfq_default_max_budget; -+ else -+ return bfqd->bfq_max_budget; -+} -+ -+/* -+ * Return min budget, which is a fraction of the current or default -+ * max budget (trying with 1/32) -+ */ -+static inline unsigned long bfq_min_budget(struct bfq_data *bfqd) -+{ -+ if (bfqd->budgets_assigned < 194) -+ return bfq_default_max_budget / 32; -+ else -+ return bfqd->bfq_max_budget / 32; -+} -+ -+static void bfq_arm_slice_timer(struct bfq_data *bfqd) -+{ -+ struct bfq_queue *bfqq = bfqd->in_service_queue; -+ struct bfq_io_cq *bic; -+ unsigned long sl; -+ -+ BUG_ON(!RB_EMPTY_ROOT(&bfqq->sort_list)); -+ -+ /* Processes have exited, don't wait. 
*/ -+ bic = bfqd->in_service_bic; -+ if (bic == NULL || atomic_read(&bic->icq.ioc->active_ref) == 0) -+ return; -+ -+ bfq_mark_bfqq_wait_request(bfqq); -+ -+ /* -+ * We don't want to idle for seeks, but we do want to allow -+ * fair distribution of slice time for a process doing back-to-back -+ * seeks. So allow a little bit of time for him to submit a new rq. -+ * -+ * To prevent processes with (partly) seeky workloads from -+ * being too ill-treated, grant them a small fraction of the -+ * assigned budget before reducing the waiting time to -+ * BFQ_MIN_TT. This happened to help reduce latency. -+ */ -+ sl = bfqd->bfq_slice_idle; -+ /* -+ * Unless the queue is being weight-raised, grant only minimum idle -+ * time if the queue either has been seeky for long enough or has -+ * already proved to be constantly seeky. -+ */ -+ if (bfq_sample_valid(bfqq->seek_samples) && -+ ((BFQQ_SEEKY(bfqq) && bfqq->entity.service > -+ bfq_max_budget(bfqq->bfqd) / 8) || -+ bfq_bfqq_constantly_seeky(bfqq)) && bfqq->wr_coeff == 1) -+ sl = min(sl, msecs_to_jiffies(BFQ_MIN_TT)); -+ else if (bfqq->wr_coeff > 1) -+ sl = sl * 3; -+ bfqd->last_idling_start = ktime_get(); -+ mod_timer(&bfqd->idle_slice_timer, jiffies + sl); -+ bfq_log(bfqd, "arm idle: %u/%u ms", -+ jiffies_to_msecs(sl), jiffies_to_msecs(bfqd->bfq_slice_idle)); -+} -+ -+/* -+ * Set the maximum time for the in-service queue to consume its -+ * budget. This prevents seeky processes from lowering the disk -+ * throughput (always guaranteed with a time slice scheme as in CFQ). -+ */ -+static void bfq_set_budget_timeout(struct bfq_data *bfqd) -+{ -+ struct bfq_queue *bfqq = bfqd->in_service_queue; -+ unsigned int timeout_coeff; -+ if (bfqq->wr_cur_max_time == bfqd->bfq_wr_rt_max_time) -+ timeout_coeff = 1; -+ else -+ timeout_coeff = bfqq->entity.weight / bfqq->entity.orig_weight; -+ -+ bfqd->last_budget_start = ktime_get(); -+ -+ bfq_clear_bfqq_budget_new(bfqq); -+ bfqq->budget_timeout = jiffies + -+ bfqd->bfq_timeout[bfq_bfqq_sync(bfqq)] * timeout_coeff; -+ -+ bfq_log_bfqq(bfqd, bfqq, "set budget_timeout %u", -+ jiffies_to_msecs(bfqd->bfq_timeout[bfq_bfqq_sync(bfqq)] * -+ timeout_coeff)); -+} -+ -+/* -+ * Move request from internal lists to the request queue dispatch list. -+ */ -+static void bfq_dispatch_insert(struct request_queue *q, struct request *rq) -+{ -+ struct bfq_data *bfqd = q->elevator->elevator_data; -+ struct bfq_queue *bfqq = RQ_BFQQ(rq); -+ -+ /* -+ * For consistency, the next instruction should have been executed -+ * after removing the request from the queue and dispatching it. -+ * We execute instead this instruction before bfq_remove_request() -+ * (and hence introduce a temporary inconsistency), for efficiency. -+ * In fact, in a forced_dispatch, this prevents two counters related -+ * to bfqq->dispatched to risk to be uselessly decremented if bfqq -+ * is not in service, and then to be incremented again after -+ * incrementing bfqq->dispatched. -+ */ -+ bfqq->dispatched++; -+ bfq_remove_request(rq); -+ elv_dispatch_sort(q, rq); -+ -+ if (bfq_bfqq_sync(bfqq)) -+ bfqd->sync_flight++; -+} -+ -+/* -+ * Return expired entry, or NULL to just start from scratch in rbtree. 
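The idle-window length chosen by bfq_arm_slice_timer follows a simple policy: the normal slice for well-behaved queues, only a minimal grace period for seeky non-weight-raised queues, and an extended one for weight-raised queues. The sketch below restates that policy as a small pure function; SLICE_IDLE_MS and MIN_TT_MS are illustrative values, not the kernel constants.

/* Sketch of the idle-slice length policy in bfq_arm_slice_timer. */
#include <stdbool.h>
#include <stdio.h>

#define SLICE_IDLE_MS	8
#define MIN_TT_MS	2

static unsigned int idle_slice_ms(bool seeky, bool weight_raised)
{
	unsigned int sl = SLICE_IDLE_MS;

	if (seeky && !weight_raised)
		sl = sl < MIN_TT_MS ? sl : MIN_TT_MS;	/* min(sl, MIN_TT) */
	else if (weight_raised)
		sl *= 3;				/* be patient with raised queues */
	return sl;
}

int main(void)
{
	printf("sequential: %u ms\n", idle_slice_ms(false, false));	/* 8 */
	printf("seeky:      %u ms\n", idle_slice_ms(true, false));	/* 2 */
	printf("raised:     %u ms\n", idle_slice_ms(false, true));	/* 24 */
	return 0;
}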
-+ */ -+static struct request *bfq_check_fifo(struct bfq_queue *bfqq) -+{ -+ struct request *rq = NULL; -+ -+ if (bfq_bfqq_fifo_expire(bfqq)) -+ return NULL; -+ -+ bfq_mark_bfqq_fifo_expire(bfqq); -+ -+ if (list_empty(&bfqq->fifo)) -+ return NULL; -+ -+ rq = rq_entry_fifo(bfqq->fifo.next); -+ -+ if (time_before(jiffies, rq->fifo_time)) -+ return NULL; -+ -+ return rq; -+} -+ -+static inline unsigned long bfq_bfqq_budget_left(struct bfq_queue *bfqq) -+{ -+ struct bfq_entity *entity = &bfqq->entity; -+ return entity->budget - entity->service; -+} -+ -+static void __bfq_bfqq_expire(struct bfq_data *bfqd, struct bfq_queue *bfqq) -+{ -+ BUG_ON(bfqq != bfqd->in_service_queue); -+ -+ __bfq_bfqd_reset_in_service(bfqd); -+ -+ /* -+ * If this bfqq is shared between multiple processes, check -+ * to make sure that those processes are still issuing I/Os -+ * within the mean seek distance. If not, it may be time to -+ * break the queues apart again. -+ */ -+ if (bfq_bfqq_coop(bfqq) && BFQQ_SEEKY(bfqq)) -+ bfq_mark_bfqq_split_coop(bfqq); -+ -+ if (RB_EMPTY_ROOT(&bfqq->sort_list)) { -+ /* -+ * Overloading budget_timeout field to store the time -+ * at which the queue remains with no backlog; used by -+ * the weight-raising mechanism. -+ */ -+ bfqq->budget_timeout = jiffies; -+ bfq_del_bfqq_busy(bfqd, bfqq, 1); -+ } else { -+ bfq_activate_bfqq(bfqd, bfqq); -+ /* -+ * Resort priority tree of potential close cooperators. -+ */ -+ bfq_rq_pos_tree_add(bfqd, bfqq); -+ } -+} -+ -+/** -+ * __bfq_bfqq_recalc_budget - try to adapt the budget to the @bfqq behavior. -+ * @bfqd: device data. -+ * @bfqq: queue to update. -+ * @reason: reason for expiration. -+ * -+ * Handle the feedback on @bfqq budget. See the body for detailed -+ * comments. -+ */ -+static void __bfq_bfqq_recalc_budget(struct bfq_data *bfqd, -+ struct bfq_queue *bfqq, -+ enum bfqq_expiration reason) -+{ -+ struct request *next_rq; -+ unsigned long budget, min_budget; -+ -+ budget = bfqq->max_budget; -+ min_budget = bfq_min_budget(bfqd); -+ -+ BUG_ON(bfqq != bfqd->in_service_queue); -+ -+ bfq_log_bfqq(bfqd, bfqq, "recalc_budg: last budg %lu, budg left %lu", -+ bfqq->entity.budget, bfq_bfqq_budget_left(bfqq)); -+ bfq_log_bfqq(bfqd, bfqq, "recalc_budg: last max_budg %lu, min budg %lu", -+ budget, bfq_min_budget(bfqd)); -+ bfq_log_bfqq(bfqd, bfqq, "recalc_budg: sync %d, seeky %d", -+ bfq_bfqq_sync(bfqq), BFQQ_SEEKY(bfqd->in_service_queue)); -+ -+ if (bfq_bfqq_sync(bfqq)) { -+ switch (reason) { -+ /* -+ * Caveat: in all the following cases we trade latency -+ * for throughput. -+ */ -+ case BFQ_BFQQ_TOO_IDLE: -+ /* -+ * This is the only case where we may reduce -+ * the budget: if there is no request of the -+ * process still waiting for completion, then -+ * we assume (tentatively) that the timer has -+ * expired because the batch of requests of -+ * the process could have been served with a -+ * smaller budget. Hence, betting that -+ * process will behave in the same way when it -+ * becomes backlogged again, we reduce its -+ * next budget. As long as we guess right, -+ * this budget cut reduces the latency -+ * experienced by the process. -+ * -+ * However, if there are still outstanding -+ * requests, then the process may have not yet -+ * issued its next request just because it is -+ * still waiting for the completion of some of -+ * the still outstanding ones. So in this -+ * subcase we do not reduce its budget, on the -+ * contrary we increase it to possibly boost -+ * the throughput, as discussed in the -+ * comments to the BUDGET_TIMEOUT case. 
-+ */ -+ if (bfqq->dispatched > 0) /* still outstanding reqs */ -+ budget = min(budget * 2, bfqd->bfq_max_budget); -+ else { -+ if (budget > 5 * min_budget) -+ budget -= 4 * min_budget; -+ else -+ budget = min_budget; -+ } -+ break; -+ case BFQ_BFQQ_BUDGET_TIMEOUT: -+ /* -+ * We double the budget here because: 1) it -+ * gives the chance to boost the throughput if -+ * this is not a seeky process (which may have -+ * bumped into this timeout because of, e.g., -+ * ZBR), 2) together with charge_full_budget -+ * it helps give seeky processes higher -+ * timestamps, and hence be served less -+ * frequently. -+ */ -+ budget = min(budget * 2, bfqd->bfq_max_budget); -+ break; -+ case BFQ_BFQQ_BUDGET_EXHAUSTED: -+ /* -+ * The process still has backlog, and did not -+ * let either the budget timeout or the disk -+ * idling timeout expire. Hence it is not -+ * seeky, has a short thinktime and may be -+ * happy with a higher budget too. So -+ * definitely increase the budget of this good -+ * candidate to boost the disk throughput. -+ */ -+ budget = min(budget * 4, bfqd->bfq_max_budget); -+ break; -+ case BFQ_BFQQ_NO_MORE_REQUESTS: -+ /* -+ * Leave the budget unchanged. -+ */ -+ default: -+ return; -+ } -+ } else /* async queue */ -+ /* async queues get always the maximum possible budget -+ * (their ability to dispatch is limited by -+ * @bfqd->bfq_max_budget_async_rq). -+ */ -+ budget = bfqd->bfq_max_budget; -+ -+ bfqq->max_budget = budget; -+ -+ if (bfqd->budgets_assigned >= 194 && bfqd->bfq_user_max_budget == 0 && -+ bfqq->max_budget > bfqd->bfq_max_budget) -+ bfqq->max_budget = bfqd->bfq_max_budget; -+ -+ /* -+ * Make sure that we have enough budget for the next request. -+ * Since the finish time of the bfqq must be kept in sync with -+ * the budget, be sure to call __bfq_bfqq_expire() after the -+ * update. -+ */ -+ next_rq = bfqq->next_rq; -+ if (next_rq != NULL) -+ bfqq->entity.budget = max_t(unsigned long, bfqq->max_budget, -+ bfq_serv_to_charge(next_rq, bfqq)); -+ else -+ bfqq->entity.budget = bfqq->max_budget; -+ -+ bfq_log_bfqq(bfqd, bfqq, "head sect: %u, new budget %lu", -+ next_rq != NULL ? blk_rq_sectors(next_rq) : 0, -+ bfqq->entity.budget); -+} -+ -+static unsigned long bfq_calc_max_budget(u64 peak_rate, u64 timeout) -+{ -+ unsigned long max_budget; -+ -+ /* -+ * The max_budget calculated when autotuning is equal to the -+ * amount of sectors transfered in timeout_sync at the -+ * estimated peak rate. -+ */ -+ max_budget = (unsigned long)(peak_rate * 1000 * -+ timeout >> BFQ_RATE_SHIFT); -+ -+ return max_budget; -+} -+ -+/* -+ * In addition to updating the peak rate, checks whether the process -+ * is "slow", and returns 1 if so. This slow flag is used, in addition -+ * to the budget timeout, to reduce the amount of service provided to -+ * seeky processes, and hence reduce their chances to lower the -+ * throughput. See the code for more details. -+ */ -+static int bfq_update_peak_rate(struct bfq_data *bfqd, struct bfq_queue *bfqq, -+ int compensate, enum bfqq_expiration reason) -+{ -+ u64 bw, usecs, expected, timeout; -+ ktime_t delta; -+ int update = 0; -+ -+ if (!bfq_bfqq_sync(bfqq) || bfq_bfqq_budget_new(bfqq)) -+ return 0; -+ -+ if (compensate) -+ delta = bfqd->last_idling_start; -+ else -+ delta = ktime_get(); -+ delta = ktime_sub(delta, bfqd->last_budget_start); -+ usecs = ktime_to_us(delta); -+ -+ /* Don't trust short/unrealistic values. */ -+ if (usecs < 100 || usecs >= LONG_MAX) -+ return 0; -+ -+ /* -+ * Calculate the bandwidth for the last slice. 
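The per-reason feedback in __bfq_bfqq_recalc_budget is easier to see as a single pure function. The sketch below mirrors the switch above (shrink on a quiet timeout, double when requests are still outstanding or on a budget timeout, quadruple on exhaustion, leave untouched otherwise); the enum names echo the kernel ones, and the numeric budgets in main are arbitrary demo values.

/* Sketch of the per-reason budget feedback in __bfq_bfqq_recalc_budget. */
#include <stdio.h>

enum expiration {
	TOO_IDLE,
	BUDGET_TIMEOUT,
	BUDGET_EXHAUSTED,
	NO_MORE_REQUESTS,
};

static unsigned long next_budget(unsigned long budget, unsigned long max_budget,
				 unsigned long min_budget, int dispatched,
				 enum expiration reason)
{
	switch (reason) {
	case TOO_IDLE:
		if (dispatched > 0)	/* still outstanding requests: be generous */
			return budget * 2 < max_budget ? budget * 2 : max_budget;
		/* otherwise bet that a smaller budget would have been enough */
		return budget > 5 * min_budget ? budget - 4 * min_budget : min_budget;
	case BUDGET_TIMEOUT:
		return budget * 2 < max_budget ? budget * 2 : max_budget;
	case BUDGET_EXHAUSTED:
		return budget * 4 < max_budget ? budget * 4 : max_budget;
	case NO_MORE_REQUESTS:
	default:
		return budget;		/* leave unchanged */
	}
}

int main(void)
{
	unsigned long max = 16384, min = max / 32;

	printf("%lu\n", next_budget(4096, max, min, 0, TOO_IDLE));	   /* 2048 */
	printf("%lu\n", next_budget(4096, max, min, 2, TOO_IDLE));	   /* 8192 */
	printf("%lu\n", next_budget(4096, max, min, 0, BUDGET_EXHAUSTED)); /* 16384 */
	return 0;
}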
We use a 64 bit -+ * value to store the peak rate, in sectors per usec in fixed -+ * point math. We do so to have enough precision in the estimate -+ * and to avoid overflows. -+ */ -+ bw = (u64)bfqq->entity.service << BFQ_RATE_SHIFT; -+ do_div(bw, (unsigned long)usecs); -+ -+ timeout = jiffies_to_msecs(bfqd->bfq_timeout[BLK_RW_SYNC]); -+ -+ /* -+ * Use only long (> 20ms) intervals to filter out spikes for -+ * the peak rate estimation. -+ */ -+ if (usecs > 20000) { -+ if (bw > bfqd->peak_rate || -+ (!BFQQ_SEEKY(bfqq) && -+ reason == BFQ_BFQQ_BUDGET_TIMEOUT)) { -+ bfq_log(bfqd, "measured bw =%llu", bw); -+ /* -+ * To smooth oscillations use a low-pass filter with -+ * alpha=7/8, i.e., -+ * new_rate = (7/8) * old_rate + (1/8) * bw -+ */ -+ do_div(bw, 8); -+ if (bw == 0) -+ return 0; -+ bfqd->peak_rate *= 7; -+ do_div(bfqd->peak_rate, 8); -+ bfqd->peak_rate += bw; -+ update = 1; -+ bfq_log(bfqd, "new peak_rate=%llu", bfqd->peak_rate); -+ } -+ -+ update |= bfqd->peak_rate_samples == BFQ_PEAK_RATE_SAMPLES - 1; -+ -+ if (bfqd->peak_rate_samples < BFQ_PEAK_RATE_SAMPLES) -+ bfqd->peak_rate_samples++; -+ -+ if (bfqd->peak_rate_samples == BFQ_PEAK_RATE_SAMPLES && -+ update) { -+ int dev_type = blk_queue_nonrot(bfqd->queue); -+ if (bfqd->bfq_user_max_budget == 0) { -+ bfqd->bfq_max_budget = -+ bfq_calc_max_budget(bfqd->peak_rate, -+ timeout); -+ bfq_log(bfqd, "new max_budget=%lu", -+ bfqd->bfq_max_budget); -+ } -+ if (bfqd->device_speed == BFQ_BFQD_FAST && -+ bfqd->peak_rate < device_speed_thresh[dev_type]) { -+ bfqd->device_speed = BFQ_BFQD_SLOW; -+ bfqd->RT_prod = R_slow[dev_type] * -+ T_slow[dev_type]; -+ } else if (bfqd->device_speed == BFQ_BFQD_SLOW && -+ bfqd->peak_rate > device_speed_thresh[dev_type]) { -+ bfqd->device_speed = BFQ_BFQD_FAST; -+ bfqd->RT_prod = R_fast[dev_type] * -+ T_fast[dev_type]; -+ } -+ } -+ } -+ -+ /* -+ * If the process has been served for a too short time -+ * interval to let its possible sequential accesses prevail on -+ * the initial seek time needed to move the disk head on the -+ * first sector it requested, then give the process a chance -+ * and for the moment return false. -+ */ -+ if (bfqq->entity.budget <= bfq_max_budget(bfqd) / 8) -+ return 0; -+ -+ /* -+ * A process is considered ``slow'' (i.e., seeky, so that we -+ * cannot treat it fairly in the service domain, as it would -+ * slow down too much the other processes) if, when a slice -+ * ends for whatever reason, it has received service at a -+ * rate that would not be high enough to complete the budget -+ * before the budget timeout expiration. -+ */ -+ expected = bw * 1000 * timeout >> BFQ_RATE_SHIFT; -+ -+ /* -+ * Caveat: processes doing IO in the slower disk zones will -+ * tend to be slow(er) even if not seeky. And the estimated -+ * peak rate will actually be an average over the disk -+ * surface. Hence, to not be too harsh with unlucky processes, -+ * we keep a budget/3 margin of safety before declaring a -+ * process slow. -+ */ -+ return expected > (4 * bfqq->entity.budget) / 3; -+} -+ -+/* -+ * To be deemed as soft real-time, an application must meet two -+ * requirements. First, the application must not require an average -+ * bandwidth higher than the approximate bandwidth required to playback or -+ * record a compressed high-definition video. 
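The low-pass filter quoted above, new_rate = (7/8) * old_rate + (1/8) * bw, can be tried out in isolation. The sketch below applies the same fixed-point update to a made-up sample series and shows how a single outlier barely moves the smoothed rate; it deliberately omits the kernel's extra conditions on when a sample is accepted.

/* Sketch of the peak-rate low-pass filter used above. */
#include <stdio.h>
#include <stdint.h>

static uint64_t lowpass_update(uint64_t rate, uint64_t sample)
{
	sample /= 8;		/* (1/8) * sample */
	if (sample == 0)
		return rate;	/* ignore samples that vanish in fixed point */
	return rate * 7 / 8 + sample;
}

int main(void)
{
	uint64_t rate = 0;
	uint64_t samples[] = { 800, 1000, 900, 4000 /* outlier */, 950 };

	for (unsigned i = 0; i < sizeof(samples) / sizeof(samples[0]); i++) {
		rate = lowpass_update(rate, samples[i]);
		printf("sample %llu -> smoothed rate %llu\n",
		       (unsigned long long)samples[i], (unsigned long long)rate);
	}
	return 0;
}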
-+ * The next function is invoked on the completion of the last request of a -+ * batch, to compute the next-start time instant, soft_rt_next_start, such -+ * that, if the next request of the application does not arrive before -+ * soft_rt_next_start, then the above requirement on the bandwidth is met. -+ * -+ * The second requirement is that the request pattern of the application is -+ * isochronous, i.e., that, after issuing a request or a batch of requests, -+ * the application stops issuing new requests until all its pending requests -+ * have been completed. After that, the application may issue a new batch, -+ * and so on. -+ * For this reason the next function is invoked to compute -+ * soft_rt_next_start only for applications that meet this requirement, -+ * whereas soft_rt_next_start is set to infinity for applications that do -+ * not. -+ * -+ * Unfortunately, even a greedy application may happen to behave in an -+ * isochronous way if the CPU load is high. In fact, the application may -+ * stop issuing requests while the CPUs are busy serving other processes, -+ * then restart, then stop again for a while, and so on. In addition, if -+ * the disk achieves a low enough throughput with the request pattern -+ * issued by the application (e.g., because the request pattern is random -+ * and/or the device is slow), then the application may meet the above -+ * bandwidth requirement too. To prevent such a greedy application to be -+ * deemed as soft real-time, a further rule is used in the computation of -+ * soft_rt_next_start: soft_rt_next_start must be higher than the current -+ * time plus the maximum time for which the arrival of a request is waited -+ * for when a sync queue becomes idle, namely bfqd->bfq_slice_idle. -+ * This filters out greedy applications, as the latter issue instead their -+ * next request as soon as possible after the last one has been completed -+ * (in contrast, when a batch of requests is completed, a soft real-time -+ * application spends some time processing data). -+ * -+ * Unfortunately, the last filter may easily generate false positives if -+ * only bfqd->bfq_slice_idle is used as a reference time interval and one -+ * or both the following cases occur: -+ * 1) HZ is so low that the duration of a jiffy is comparable to or higher -+ * than bfqd->bfq_slice_idle. This happens, e.g., on slow devices with -+ * HZ=100. -+ * 2) jiffies, instead of increasing at a constant rate, may stop increasing -+ * for a while, then suddenly 'jump' by several units to recover the lost -+ * increments. This seems to happen, e.g., inside virtual machines. -+ * To address this issue, we do not use as a reference time interval just -+ * bfqd->bfq_slice_idle, but bfqd->bfq_slice_idle plus a few jiffies. In -+ * particular we add the minimum number of jiffies for which the filter -+ * seems to be quite precise also in embedded systems and KVM/QEMU virtual -+ * machines. -+ */ -+static inline unsigned long bfq_bfqq_softrt_next_start(struct bfq_data *bfqd, -+ struct bfq_queue *bfqq) -+{ -+ return max(bfqq->last_idle_bklogged + -+ HZ * bfqq->service_from_backlogged / -+ bfqd->bfq_wr_max_softrt_rate, -+ jiffies + bfqq->bfqd->bfq_slice_idle + 4); -+} -+ -+/* -+ * Return the largest-possible time instant such that, for as long as possible, -+ * the current time will be lower than this time instant according to the macro -+ * time_is_before_jiffies(). 
-+ */ -+static inline unsigned long bfq_infinity_from_now(unsigned long now) -+{ -+ return now + ULONG_MAX / 2; -+} -+ -+/** -+ * bfq_bfqq_expire - expire a queue. -+ * @bfqd: device owning the queue. -+ * @bfqq: the queue to expire. -+ * @compensate: if true, compensate for the time spent idling. -+ * @reason: the reason causing the expiration. -+ * -+ * -+ * If the process associated to the queue is slow (i.e., seeky), or in -+ * case of budget timeout, or, finally, if it is async, we -+ * artificially charge it an entire budget (independently of the -+ * actual service it received). As a consequence, the queue will get -+ * higher timestamps than the correct ones upon reactivation, and -+ * hence it will be rescheduled as if it had received more service -+ * than what it actually received. In the end, this class of processes -+ * will receive less service in proportion to how slowly they consume -+ * their budgets (and hence how seriously they tend to lower the -+ * throughput). -+ * -+ * In contrast, when a queue expires because it has been idling for -+ * too much or because it exhausted its budget, we do not touch the -+ * amount of service it has received. Hence when the queue will be -+ * reactivated and its timestamps updated, the latter will be in sync -+ * with the actual service received by the queue until expiration. -+ * -+ * Charging a full budget to the first type of queues and the exact -+ * service to the others has the effect of using the WF2Q+ policy to -+ * schedule the former on a timeslice basis, without violating the -+ * service domain guarantees of the latter. -+ */ -+static void bfq_bfqq_expire(struct bfq_data *bfqd, -+ struct bfq_queue *bfqq, -+ int compensate, -+ enum bfqq_expiration reason) -+{ -+ int slow; -+ BUG_ON(bfqq != bfqd->in_service_queue); -+ -+ /* Update disk peak rate for autotuning and check whether the -+ * process is slow (see bfq_update_peak_rate). -+ */ -+ slow = bfq_update_peak_rate(bfqd, bfqq, compensate, reason); -+ -+ /* -+ * As above explained, 'punish' slow (i.e., seeky), timed-out -+ * and async queues, to favor sequential sync workloads. -+ * -+ * Processes doing I/O in the slower disk zones will tend to be -+ * slow(er) even if not seeky. Hence, since the estimated peak -+ * rate is actually an average over the disk surface, these -+ * processes may timeout just for bad luck. To avoid punishing -+ * them we do not charge a full budget to a process that -+ * succeeded in consuming at least 2/3 of its budget. -+ */ -+ if (slow || (reason == BFQ_BFQQ_BUDGET_TIMEOUT && -+ bfq_bfqq_budget_left(bfqq) >= bfqq->entity.budget / 3)) -+ bfq_bfqq_charge_full_budget(bfqq); -+ -+ bfqq->service_from_backlogged += bfqq->entity.service; -+ -+ if (BFQQ_SEEKY(bfqq) && reason == BFQ_BFQQ_BUDGET_TIMEOUT && -+ !bfq_bfqq_constantly_seeky(bfqq)) { -+ bfq_mark_bfqq_constantly_seeky(bfqq); -+ if (!blk_queue_nonrot(bfqd->queue)) -+ bfqd->const_seeky_busy_in_flight_queues++; -+ } -+ -+ if (reason == BFQ_BFQQ_TOO_IDLE && -+ bfqq->entity.service <= 2 * bfqq->entity.budget / 10 ) -+ bfq_clear_bfqq_IO_bound(bfqq); -+ -+ if (bfqd->low_latency && bfqq->wr_coeff == 1) -+ bfqq->last_wr_start_finish = jiffies; -+ -+ if (bfqd->low_latency && bfqd->bfq_wr_max_softrt_rate > 0 && -+ RB_EMPTY_ROOT(&bfqq->sort_list)) { -+ /* -+ * If we get here, and there are no outstanding requests, -+ * then the request pattern is isochronous (see the comments -+ * to the function bfq_bfqq_softrt_next_start()). Hence we -+ * can compute soft_rt_next_start. 
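bfq_infinity_from_now() above leans on the kernel's wraparound-safe time comparisons. The sketch below uses a simplified stand-in for time_after()/time_before() to show why now + ULONG_MAX / 2 acts as "never reached" and why the comparison keeps working when the counter wraps.

/* Sketch of wraparound-safe time comparison: a - b is evaluated as a
 * signed value, so the test survives the counter wrapping. The macros
 * are simplified stand-ins for the kernel ones of the same name. */
#include <stdio.h>
#include <limits.h>

#define time_after(a, b)  ((long)((b) - (a)) < 0)
#define time_before(a, b) time_after(b, a)

int main(void)
{
	unsigned long now = ULONG_MAX - 10;	/* just before the counter wraps */
	unsigned long soon = now + 20;		/* wraps around to a small value */
	unsigned long never = now + ULONG_MAX / 2;

	printf("soon is after now:   %d\n", time_after(soon, now));	/* 1 */
	printf("now before 'never':  %d\n", time_before(now, never));	/* 1 */
	printf("'never' reached yet: %d\n", time_after(now, never));	/* 0 */
	return 0;
}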
If, instead, the queue -+ * still has outstanding requests, then we have to wait -+ * for the completion of all the outstanding requests to -+ * discover whether the request pattern is actually -+ * isochronous. -+ */ -+ if (bfqq->dispatched == 0) -+ bfqq->soft_rt_next_start = -+ bfq_bfqq_softrt_next_start(bfqd, bfqq); -+ else { -+ /* -+ * The application is still waiting for the -+ * completion of one or more requests: -+ * prevent it from possibly being incorrectly -+ * deemed as soft real-time by setting its -+ * soft_rt_next_start to infinity. In fact, -+ * without this assignment, the application -+ * would be incorrectly deemed as soft -+ * real-time if: -+ * 1) it issued a new request before the -+ * completion of all its in-flight -+ * requests, and -+ * 2) at that time, its soft_rt_next_start -+ * happened to be in the past. -+ */ -+ bfqq->soft_rt_next_start = -+ bfq_infinity_from_now(jiffies); -+ /* -+ * Schedule an update of soft_rt_next_start to when -+ * the task may be discovered to be isochronous. -+ */ -+ bfq_mark_bfqq_softrt_update(bfqq); -+ } -+ } -+ -+ bfq_log_bfqq(bfqd, bfqq, -+ "expire (%d, slow %d, num_disp %d, idle_win %d)", reason, -+ slow, bfqq->dispatched, bfq_bfqq_idle_window(bfqq)); -+ -+ /* -+ * Increase, decrease or leave budget unchanged according to -+ * reason. -+ */ -+ __bfq_bfqq_recalc_budget(bfqd, bfqq, reason); -+ __bfq_bfqq_expire(bfqd, bfqq); -+} -+ -+/* -+ * Budget timeout is not implemented through a dedicated timer, but -+ * just checked on request arrivals and completions, as well as on -+ * idle timer expirations. -+ */ -+static int bfq_bfqq_budget_timeout(struct bfq_queue *bfqq) -+{ -+ if (bfq_bfqq_budget_new(bfqq) || -+ time_before(jiffies, bfqq->budget_timeout)) -+ return 0; -+ return 1; -+} -+ -+/* -+ * If we expire a queue that is waiting for the arrival of a new -+ * request, we may prevent the fictitious timestamp back-shifting that -+ * allows the guarantees of the queue to be preserved (see [1] for -+ * this tricky aspect). Hence we return true only if this condition -+ * does not hold, or if the queue is slow enough to deserve only to be -+ * kicked off for preserving a high throughput. -+*/ -+static inline int bfq_may_expire_for_budg_timeout(struct bfq_queue *bfqq) -+{ -+ bfq_log_bfqq(bfqq->bfqd, bfqq, -+ "may_budget_timeout: wait_request %d left %d timeout %d", -+ bfq_bfqq_wait_request(bfqq), -+ bfq_bfqq_budget_left(bfqq) >= bfqq->entity.budget / 3, -+ bfq_bfqq_budget_timeout(bfqq)); -+ -+ return (!bfq_bfqq_wait_request(bfqq) || -+ bfq_bfqq_budget_left(bfqq) >= bfqq->entity.budget / 3) -+ && -+ bfq_bfqq_budget_timeout(bfqq); -+} -+ -+/* -+ * Device idling is allowed only for the queues for which this function -+ * returns true. For this reason, the return value of this function plays a -+ * critical role for both throughput boosting and service guarantees. The -+ * return value is computed through a logical expression. In this rather -+ * long comment, we try to briefly describe all the details and motivations -+ * behind the components of this logical expression. -+ * -+ * First, the expression is false if bfqq is not sync, or if: bfqq happened -+ * to become active during a large burst of queue activations, and the -+ * pattern of requests bfqq contains boosts the throughput if bfqq is -+ * expired. In fact, queues that became active during a large burst benefit -+ * only from throughput, as discussed in the comments to bfq_handle_burst. 
-+ * In this respect, expiring bfqq certainly boosts the throughput on NCQ- -+ * capable flash-based devices, whereas, on rotational devices, it boosts -+ * the throughput only if bfqq contains random requests. -+ * -+ * On the opposite end, if (a) bfqq is sync, (b) the above burst-related -+ * condition does not hold, and (c) bfqq is being weight-raised, then the -+ * expression always evaluates to true, as device idling is instrumental -+ * for preserving low-latency guarantees (see [1]). If, instead, conditions -+ * (a) and (b) do hold, but (c) does not, then the expression evaluates to -+ * true only if: (1) bfqq is I/O-bound and has a non-null idle window, and -+ * (2) at least one of the following two conditions holds. -+ * The first condition is that the device is not performing NCQ, because -+ * idling the device most certainly boosts the throughput if this condition -+ * holds and bfqq is I/O-bound and has been granted a non-null idle window. -+ * The second compound condition is made of the logical AND of two components. -+ * -+ * The first component is true only if there is no weight-raised busy -+ * queue. This guarantees that the device is not idled for a sync non- -+ * weight-raised queue when there are busy weight-raised queues. The former -+ * is then expired immediately if empty. Combined with the timestamping -+ * rules of BFQ (see [1] for details), this causes sync non-weight-raised -+ * queues to get a lower number of requests served, and hence to ask for a -+ * lower number of requests from the request pool, before the busy weight- -+ * raised queues get served again. -+ * -+ * This is beneficial for the processes associated with weight-raised -+ * queues, when the request pool is saturated (e.g., in the presence of -+ * write hogs). In fact, if the processes associated with the other queues -+ * ask for requests at a lower rate, then weight-raised processes have a -+ * higher probability to get a request from the pool immediately (or at -+ * least soon) when they need one. Hence they have a higher probability to -+ * actually get a fraction of the disk throughput proportional to their -+ * high weight. This is especially true with NCQ-capable drives, which -+ * enqueue several requests in advance and further reorder internally- -+ * queued requests. -+ * -+ * In the end, mistreating non-weight-raised queues when there are busy -+ * weight-raised queues seems to mitigate starvation problems in the -+ * presence of heavy write workloads and NCQ, and hence to guarantee a -+ * higher application and system responsiveness in these hostile scenarios. -+ * -+ * If the first component of the compound condition is instead true, i.e., -+ * there is no weight-raised busy queue, then the second component of the -+ * compound condition takes into account service-guarantee and throughput -+ * issues related to NCQ (recall that the compound condition is evaluated -+ * only if the device is detected as supporting NCQ). -+ * -+ * As for service guarantees, allowing the drive to enqueue more than one -+ * request at a time, and hence delegating de facto final scheduling -+ * decisions to the drive's internal scheduler, causes loss of control on -+ * the actual request service order. 
In this respect, when the drive is -+ * allowed to enqueue more than one request at a time, the service -+ * distribution enforced by the drive's internal scheduler is likely to -+ * coincide with the desired device-throughput distribution only in the -+ * following, perfectly symmetric, scenario: -+ * 1) all active queues have the same weight, -+ * 2) all active groups at the same level in the groups tree have the same -+ * weight, -+ * 3) all active groups at the same level in the groups tree have the same -+ * number of children. -+ * -+ * Even in such a scenario, sequential I/O may still receive a preferential -+ * treatment, but this is not likely to be a big issue with flash-based -+ * devices, because of their non-dramatic loss of throughput with random -+ * I/O. Things do differ with HDDs, for which additional care is taken, as -+ * explained after completing the discussion for flash-based devices. -+ * -+ * Unfortunately, keeping the necessary state for evaluating exactly the -+ * above symmetry conditions would be quite complex and time-consuming. -+ * Therefore BFQ evaluates instead the following stronger sub-conditions, -+ * for which it is much easier to maintain the needed state: -+ * 1) all active queues have the same weight, -+ * 2) all active groups have the same weight, -+ * 3) all active groups have at most one active child each. -+ * In particular, the last two conditions are always true if hierarchical -+ * support and the cgroups interface are not enabled, hence no state needs -+ * to be maintained in this case. -+ * -+ * According to the above considerations, the second component of the -+ * compound condition evaluates to true if any of the above symmetry -+ * sub-condition does not hold, or the device is not flash-based. Therefore, -+ * if also the first component is true, then idling is allowed for a sync -+ * queue. These are the only sub-conditions considered if the device is -+ * flash-based, as, for such a device, it is sensible to force idling only -+ * for service-guarantee issues. In fact, as for throughput, idling -+ * NCQ-capable flash-based devices would not boost the throughput even -+ * with sequential I/O; rather it would lower the throughput in proportion -+ * to how fast the device is. In the end, (only) if all the three -+ * sub-conditions hold and the device is flash-based, the compound -+ * condition evaluates to false and therefore no idling is performed. -+ * -+ * As already said, things change with a rotational device, where idling -+ * boosts the throughput with sequential I/O (even with NCQ). Hence, for -+ * such a device the second component of the compound condition evaluates -+ * to true also if the following additional sub-condition does not hold: -+ * the queue is constantly seeky. Unfortunately, this different behavior -+ * with respect to flash-based devices causes an additional asymmetry: if -+ * some sync queues enjoy idling and some other sync queues do not, then -+ * the latter get a low share of the device throughput, simply because the -+ * former get many requests served after being set as in service, whereas -+ * the latter do not. As a consequence, to guarantee the desired throughput -+ * distribution, on HDDs the compound expression evaluates to true (and -+ * hence device idling is performed) also if the following last symmetry -+ * condition does not hold: no other queue is benefiting from idling. 
Also -+ * this last condition is actually replaced with a simpler-to-maintain and -+ * stronger condition: there is no busy queue which is not constantly seeky -+ * (and hence may also benefit from idling). -+ * -+ * To sum up, when all the required symmetry and throughput-boosting -+ * sub-conditions hold, the second component of the compound condition -+ * evaluates to false, and hence no idling is performed. This helps to -+ * keep the drives' internal queues full on NCQ-capable devices, and hence -+ * to boost the throughput, without causing 'almost' any loss of service -+ * guarantees. The 'almost' follows from the fact that, if the internal -+ * queue of one such device is filled while all the sub-conditions hold, -+ * but at some point in time some sub-condition stops to hold, then it may -+ * become impossible to let requests be served in the new desired order -+ * until all the requests already queued in the device have been served. -+ */ -+static inline bool bfq_bfqq_must_not_expire(struct bfq_queue *bfqq) -+{ -+ struct bfq_data *bfqd = bfqq->bfqd; -+#ifdef CONFIG_CGROUP_BFQIO -+#define symmetric_scenario (!bfqd->active_numerous_groups && \ -+ !bfq_differentiated_weights(bfqd)) -+#else -+#define symmetric_scenario (!bfq_differentiated_weights(bfqd)) -+#endif -+#define cond_for_seeky_on_ncq_hdd (bfq_bfqq_constantly_seeky(bfqq) && \ -+ bfqd->busy_in_flight_queues == \ -+ bfqd->const_seeky_busy_in_flight_queues) -+ -+#define cond_for_expiring_in_burst (bfq_bfqq_in_large_burst(bfqq) && \ -+ bfqd->hw_tag && \ -+ (blk_queue_nonrot(bfqd->queue) || \ -+ bfq_bfqq_constantly_seeky(bfqq))) -+ -+/* -+ * Condition for expiring a non-weight-raised queue (and hence not idling -+ * the device). -+ */ -+#define cond_for_expiring_non_wr (bfqd->hw_tag && \ -+ (bfqd->wr_busy_queues > 0 || \ -+ (symmetric_scenario && \ -+ (blk_queue_nonrot(bfqd->queue) || \ -+ cond_for_seeky_on_ncq_hdd)))) -+ -+ return bfq_bfqq_sync(bfqq) && -+ !cond_for_expiring_in_burst && -+ (bfqq->wr_coeff > 1 || -+ (bfq_bfqq_IO_bound(bfqq) && bfq_bfqq_idle_window(bfqq) && -+ !cond_for_expiring_non_wr) -+ ); -+} -+ -+/* -+ * If the in-service queue is empty but sync, and the function -+ * bfq_bfqq_must_not_expire returns true, then: -+ * 1) the queue must remain in service and cannot be expired, and -+ * 2) the disk must be idled to wait for the possible arrival of a new -+ * request for the queue. -+ * See the comments to the function bfq_bfqq_must_not_expire for the reasons -+ * why performing device idling is the best choice to boost the throughput -+ * and preserve service guarantees when bfq_bfqq_must_not_expire itself -+ * returns true. -+ */ -+static inline bool bfq_bfqq_must_idle(struct bfq_queue *bfqq) -+{ -+ struct bfq_data *bfqd = bfqq->bfqd; -+ -+ return RB_EMPTY_ROOT(&bfqq->sort_list) && bfqd->bfq_slice_idle != 0 && -+ bfq_bfqq_must_not_expire(bfqq); -+} -+ -+/* -+ * Select a queue for service. If we have a current queue in service, -+ * check whether to continue servicing it, or retrieve and set a new one. 
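For readers untangling the macro-based condition above, here is a minimal userspace sketch, not part of the patch, that restates bfq_bfqq_must_not_expire() as a plain function over precomputed booleans; every field is a hypothetical stand-in for the corresponding bfqd/bfqq test.

#include <stdbool.h>
#include <stdio.h>

/* Illustrative restatement of bfq_bfqq_must_not_expire(); each field is a
 * precomputed stand-in for one of the tests performed by the real macros. */
struct idling_inputs {
	bool sync;                 /* bfq_bfqq_sync()                          */
	bool in_large_burst;       /* bfq_bfqq_in_large_burst()                */
	bool hw_tag;               /* device detected as NCQ-capable           */
	bool nonrot;               /* blk_queue_nonrot()                       */
	bool constantly_seeky;     /* bfq_bfqq_constantly_seeky()              */
	bool weight_raised;        /* bfqq->wr_coeff > 1                       */
	bool io_bound;             /* bfq_bfqq_IO_bound()                      */
	bool idle_window;          /* bfq_bfqq_idle_window()                   */
	bool wr_busy_queues;       /* bfqd->wr_busy_queues > 0                 */
	bool symmetric_scenario;   /* no differentiated weights/groups         */
	bool all_busy_const_seeky; /* busy_in_flight == const_seeky_busy       */
};

static bool must_not_expire(const struct idling_inputs *in)
{
	bool expiring_in_burst = in->in_large_burst && in->hw_tag &&
				 (in->nonrot || in->constantly_seeky);
	bool seeky_on_ncq_hdd = in->constantly_seeky && in->all_busy_const_seeky;
	bool expiring_non_wr = in->hw_tag &&
			       (in->wr_busy_queues ||
				(in->symmetric_scenario &&
				 (in->nonrot || seeky_on_ncq_hdd)));

	return in->sync && !expiring_in_burst &&
	       (in->weight_raised ||
		(in->io_bound && in->idle_window && !expiring_non_wr));
}

int main(void)
{
	struct idling_inputs wr_queue = { .sync = true, .weight_raised = true,
					  .hw_tag = true, .nonrot = true };

	printf("weight-raised sync queue keeps the device idling: %d\n",
	       must_not_expire(&wr_queue));
	return 0;
}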
-+ */ -+static struct bfq_queue *bfq_select_queue(struct bfq_data *bfqd) -+{ -+ struct bfq_queue *bfqq; -+ struct request *next_rq; -+ enum bfqq_expiration reason = BFQ_BFQQ_BUDGET_TIMEOUT; -+ -+ bfqq = bfqd->in_service_queue; -+ if (bfqq == NULL) -+ goto new_queue; -+ -+ bfq_log_bfqq(bfqd, bfqq, "select_queue: already in-service queue"); -+ -+ if (bfq_may_expire_for_budg_timeout(bfqq) && -+ !timer_pending(&bfqd->idle_slice_timer) && -+ !bfq_bfqq_must_idle(bfqq)) -+ goto expire; -+ -+ next_rq = bfqq->next_rq; -+ /* -+ * If bfqq has requests queued and it has enough budget left to -+ * serve them, keep the queue, otherwise expire it. -+ */ -+ if (next_rq != NULL) { -+ if (bfq_serv_to_charge(next_rq, bfqq) > -+ bfq_bfqq_budget_left(bfqq)) { -+ reason = BFQ_BFQQ_BUDGET_EXHAUSTED; -+ goto expire; -+ } else { -+ /* -+ * The idle timer may be pending because we may -+ * not disable disk idling even when a new request -+ * arrives. -+ */ -+ if (timer_pending(&bfqd->idle_slice_timer)) { -+ /* -+ * If we get here: 1) at least a new request -+ * has arrived but we have not disabled the -+ * timer because the request was too small, -+ * 2) then the block layer has unplugged -+ * the device, causing the dispatch to be -+ * invoked. -+ * -+ * Since the device is unplugged, now the -+ * requests are probably large enough to -+ * provide a reasonable throughput. -+ * So we disable idling. -+ */ -+ bfq_clear_bfqq_wait_request(bfqq); -+ del_timer(&bfqd->idle_slice_timer); -+ } -+ goto keep_queue; -+ } -+ } -+ -+ /* -+ * No requests pending. If the in-service queue still has requests -+ * in flight (possibly waiting for a completion) or is idling for a -+ * new request, then keep it. -+ */ -+ if (timer_pending(&bfqd->idle_slice_timer) || -+ (bfqq->dispatched != 0 && bfq_bfqq_must_not_expire(bfqq))) { -+ bfqq = NULL; -+ goto keep_queue; -+ } -+ -+ reason = BFQ_BFQQ_NO_MORE_REQUESTS; -+expire: -+ bfq_bfqq_expire(bfqd, bfqq, 0, reason); -+new_queue: -+ bfqq = bfq_set_in_service_queue(bfqd); -+ bfq_log(bfqd, "select_queue: new queue %d returned", -+ bfqq != NULL ? bfqq->pid : 0); -+keep_queue: -+ return bfqq; -+} -+ -+static void bfq_update_wr_data(struct bfq_data *bfqd, struct bfq_queue *bfqq) -+{ -+ struct bfq_entity *entity = &bfqq->entity; -+ if (bfqq->wr_coeff > 1) { /* queue is being weight-raised */ -+ bfq_log_bfqq(bfqd, bfqq, -+ "raising period dur %u/%u msec, old coeff %u, w %d(%d)", -+ jiffies_to_msecs(jiffies - bfqq->last_wr_start_finish), -+ jiffies_to_msecs(bfqq->wr_cur_max_time), -+ bfqq->wr_coeff, -+ bfqq->entity.weight, bfqq->entity.orig_weight); -+ -+ BUG_ON(bfqq != bfqd->in_service_queue && entity->weight != -+ entity->orig_weight * bfqq->wr_coeff); -+ if (entity->ioprio_changed) -+ bfq_log_bfqq(bfqd, bfqq, "WARN: pending prio change"); -+ -+ /* -+ * If the queue was activated in a burst, or -+ * too much time has elapsed from the beginning -+ * of this weight-raising period, or the queue has -+ * exceeded the acceptable number of cooperations, -+ * then end weight raising. 
-+ */ -+ if (bfq_bfqq_in_large_burst(bfqq) || -+ bfq_bfqq_cooperations(bfqq) >= bfqd->bfq_coop_thresh || -+ time_is_before_jiffies(bfqq->last_wr_start_finish + -+ bfqq->wr_cur_max_time)) { -+ bfqq->last_wr_start_finish = jiffies; -+ bfq_log_bfqq(bfqd, bfqq, -+ "wrais ending at %lu, rais_max_time %u", -+ bfqq->last_wr_start_finish, -+ jiffies_to_msecs(bfqq->wr_cur_max_time)); -+ bfq_bfqq_end_wr(bfqq); -+ } -+ } -+ /* Update weight both if it must be raised and if it must be lowered */ -+ if ((entity->weight > entity->orig_weight) != (bfqq->wr_coeff > 1)) -+ __bfq_entity_update_weight_prio( -+ bfq_entity_service_tree(entity), -+ entity); -+} -+ -+/* -+ * Dispatch one request from bfqq, moving it to the request queue -+ * dispatch list. -+ */ -+static int bfq_dispatch_request(struct bfq_data *bfqd, -+ struct bfq_queue *bfqq) -+{ -+ int dispatched = 0; -+ struct request *rq; -+ unsigned long service_to_charge; -+ -+ BUG_ON(RB_EMPTY_ROOT(&bfqq->sort_list)); -+ -+ /* Follow expired path, else get first next available. */ -+ rq = bfq_check_fifo(bfqq); -+ if (rq == NULL) -+ rq = bfqq->next_rq; -+ service_to_charge = bfq_serv_to_charge(rq, bfqq); -+ -+ if (service_to_charge > bfq_bfqq_budget_left(bfqq)) { -+ /* -+ * This may happen if the next rq is chosen in fifo order -+ * instead of sector order. The budget is properly -+ * dimensioned to be always sufficient to serve the next -+ * request only if it is chosen in sector order. The reason -+ * is that it would be quite inefficient and little useful -+ * to always make sure that the budget is large enough to -+ * serve even the possible next rq in fifo order. -+ * In fact, requests are seldom served in fifo order. -+ * -+ * Expire the queue for budget exhaustion, and make sure -+ * that the next act_budget is enough to serve the next -+ * request, even if it comes from the fifo expired path. -+ */ -+ bfqq->next_rq = rq; -+ /* -+ * Since this dispatch is failed, make sure that -+ * a new one will be performed -+ */ -+ if (!bfqd->rq_in_driver) -+ bfq_schedule_dispatch(bfqd); -+ goto expire; -+ } -+ -+ /* Finally, insert request into driver dispatch list. */ -+ bfq_bfqq_served(bfqq, service_to_charge); -+ bfq_dispatch_insert(bfqd->queue, rq); -+ -+ bfq_update_wr_data(bfqd, bfqq); -+ -+ bfq_log_bfqq(bfqd, bfqq, -+ "dispatched %u sec req (%llu), budg left %lu", -+ blk_rq_sectors(rq), -+ (long long unsigned)blk_rq_pos(rq), -+ bfq_bfqq_budget_left(bfqq)); -+ -+ dispatched++; -+ -+ if (bfqd->in_service_bic == NULL) { -+ atomic_long_inc(&RQ_BIC(rq)->icq.ioc->refcount); -+ bfqd->in_service_bic = RQ_BIC(rq); -+ } -+ -+ if (bfqd->busy_queues > 1 && ((!bfq_bfqq_sync(bfqq) && -+ dispatched >= bfqd->bfq_max_budget_async_rq) || -+ bfq_class_idle(bfqq))) -+ goto expire; -+ -+ return dispatched; -+ -+expire: -+ bfq_bfqq_expire(bfqd, bfqq, 0, BFQ_BFQQ_BUDGET_EXHAUSTED); -+ return dispatched; -+} -+ -+static int __bfq_forced_dispatch_bfqq(struct bfq_queue *bfqq) -+{ -+ int dispatched = 0; -+ -+ while (bfqq->next_rq != NULL) { -+ bfq_dispatch_insert(bfqq->bfqd->queue, bfqq->next_rq); -+ dispatched++; -+ } -+ -+ BUG_ON(!list_empty(&bfqq->fifo)); -+ return dispatched; -+} -+ -+/* -+ * Drain our current requests. -+ * Used for barriers and when switching io schedulers on-the-fly. 
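The budget accounting that drives the BUDGET_EXHAUSTED path above can be seen in isolation with a small stand-alone sketch; the sector counts and the initial budget below are invented for the demonstration.

#include <stdio.h>

/* Toy model of the budget check in bfq_dispatch_request(): requests are
 * dispatched while they fit in the queue's remaining budget; the first
 * request that does not fit triggers a BUDGET_EXHAUSTED expiration. */
int main(void)
{
	unsigned long budget_left = 512;               /* sectors still allowed */
	unsigned long requests[] = { 128, 256, 64, 512, 8 };
	unsigned int i;

	for (i = 0; i < sizeof(requests) / sizeof(requests[0]); i++) {
		if (requests[i] > budget_left) {
			printf("req %u (%lu sectors): budget exhausted, expire queue\n",
			       i, requests[i]);
			break;
		}
		budget_left -= requests[i];
		printf("req %u (%lu sectors) dispatched, budget left %lu\n",
		       i, requests[i], budget_left);
	}
	return 0;
}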
-+ */ -+static int bfq_forced_dispatch(struct bfq_data *bfqd) -+{ -+ struct bfq_queue *bfqq, *n; -+ struct bfq_service_tree *st; -+ int dispatched = 0; -+ -+ bfqq = bfqd->in_service_queue; -+ if (bfqq != NULL) -+ __bfq_bfqq_expire(bfqd, bfqq); -+ -+ /* -+ * Loop through classes, and be careful to leave the scheduler -+ * in a consistent state, as feedback mechanisms and vtime -+ * updates cannot be disabled during the process. -+ */ -+ list_for_each_entry_safe(bfqq, n, &bfqd->active_list, bfqq_list) { -+ st = bfq_entity_service_tree(&bfqq->entity); -+ -+ dispatched += __bfq_forced_dispatch_bfqq(bfqq); -+ bfqq->max_budget = bfq_max_budget(bfqd); -+ -+ bfq_forget_idle(st); -+ } -+ -+ BUG_ON(bfqd->busy_queues != 0); -+ -+ return dispatched; -+} -+ -+static int bfq_dispatch_requests(struct request_queue *q, int force) -+{ -+ struct bfq_data *bfqd = q->elevator->elevator_data; -+ struct bfq_queue *bfqq; -+ int max_dispatch; -+ -+ bfq_log(bfqd, "dispatch requests: %d busy queues", bfqd->busy_queues); -+ if (bfqd->busy_queues == 0) -+ return 0; -+ -+ if (unlikely(force)) -+ return bfq_forced_dispatch(bfqd); -+ -+ bfqq = bfq_select_queue(bfqd); -+ if (bfqq == NULL) -+ return 0; -+ -+ max_dispatch = bfqd->bfq_quantum; -+ if (bfq_class_idle(bfqq)) -+ max_dispatch = 1; -+ -+ if (!bfq_bfqq_sync(bfqq)) -+ max_dispatch = bfqd->bfq_max_budget_async_rq; -+ -+ if (bfqq->dispatched >= max_dispatch) { -+ if (bfqd->busy_queues > 1) -+ return 0; -+ if (bfqq->dispatched >= 4 * max_dispatch) -+ return 0; -+ } -+ -+ if (bfqd->sync_flight != 0 && !bfq_bfqq_sync(bfqq)) -+ return 0; -+ -+ bfq_clear_bfqq_wait_request(bfqq); -+ BUG_ON(timer_pending(&bfqd->idle_slice_timer)); -+ -+ if (!bfq_dispatch_request(bfqd, bfqq)) -+ return 0; -+ -+ bfq_log_bfqq(bfqd, bfqq, "dispatched one request of %d (max_disp %d)", -+ bfqq->pid, max_dispatch); -+ -+ return 1; -+} -+ -+/* -+ * Task holds one reference to the queue, dropped when task exits. Each rq -+ * in-flight on this queue also holds a reference, dropped when rq is freed. -+ * -+ * Queue lock must be held here. -+ */ -+static void bfq_put_queue(struct bfq_queue *bfqq) -+{ -+ struct bfq_data *bfqd = bfqq->bfqd; -+ -+ BUG_ON(atomic_read(&bfqq->ref) <= 0); -+ -+ bfq_log_bfqq(bfqd, bfqq, "put_queue: %p %d", bfqq, -+ atomic_read(&bfqq->ref)); -+ if (!atomic_dec_and_test(&bfqq->ref)) -+ return; -+ -+ BUG_ON(rb_first(&bfqq->sort_list) != NULL); -+ BUG_ON(bfqq->allocated[READ] + bfqq->allocated[WRITE] != 0); -+ BUG_ON(bfqq->entity.tree != NULL); -+ BUG_ON(bfq_bfqq_busy(bfqq)); -+ BUG_ON(bfqd->in_service_queue == bfqq); -+ -+ if (bfq_bfqq_sync(bfqq)) -+ /* -+ * The fact that this queue is being destroyed does not -+ * invalidate the fact that this queue may have been -+ * activated during the current burst. As a consequence, -+ * although the queue does not exist anymore, and hence -+ * needs to be removed from the burst list if there, -+ * the burst size has not to be decremented. -+ */ -+ hlist_del_init(&bfqq->burst_list_node); -+ -+ bfq_log_bfqq(bfqd, bfqq, "put_queue: %p freed", bfqq); -+ -+ kmem_cache_free(bfq_pool, bfqq); -+} -+ -+static void bfq_put_cooperator(struct bfq_queue *bfqq) -+{ -+ struct bfq_queue *__bfqq, *next; -+ -+ /* -+ * If this queue was scheduled to merge with another queue, be -+ * sure to drop the reference taken on that queue (and others in -+ * the merge chain). See bfq_setup_merge and bfq_merge_bfqqs. 
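A compact restatement of the per-round dispatch cap applied in bfq_dispatch_requests(); the helper and its numeric arguments are illustrative stand-ins, not the scheduler's actual tunables.

#include <stdbool.h>
#include <stdio.h>

/* Simplified model of the dispatch quota: idle-class queues get one request,
 * async queues are capped by the async budget, everything else by the
 * quantum; an over-quota queue may still be driven further (up to 4x) when
 * it is the only busy one. */
static int may_dispatch(bool sync, bool class_idle, int dispatched,
			int busy_queues, int quantum, int max_async_rq)
{
	int max_dispatch = quantum;

	if (class_idle)
		max_dispatch = 1;
	if (!sync)
		max_dispatch = max_async_rq;

	if (dispatched >= max_dispatch) {
		if (busy_queues > 1)
			return 0;
		if (dispatched >= 4 * max_dispatch)
			return 0;
	}
	return 1;
}

int main(void)
{
	printf("%d\n", may_dispatch(true, false, 6, 3, 4, 4)); /* over quota, contended: 0 */
	printf("%d\n", may_dispatch(true, false, 6, 1, 4, 4)); /* over quota, alone: 1     */
	return 0;
}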
-+ */ -+ __bfqq = bfqq->new_bfqq; -+ while (__bfqq) { -+ if (__bfqq == bfqq) -+ break; -+ next = __bfqq->new_bfqq; -+ bfq_put_queue(__bfqq); -+ __bfqq = next; -+ } -+} -+ -+static void bfq_exit_bfqq(struct bfq_data *bfqd, struct bfq_queue *bfqq) -+{ -+ if (bfqq == bfqd->in_service_queue) { -+ __bfq_bfqq_expire(bfqd, bfqq); -+ bfq_schedule_dispatch(bfqd); -+ } -+ -+ bfq_log_bfqq(bfqd, bfqq, "exit_bfqq: %p, %d", bfqq, -+ atomic_read(&bfqq->ref)); -+ -+ bfq_put_cooperator(bfqq); -+ -+ bfq_put_queue(bfqq); -+} -+ -+static inline void bfq_init_icq(struct io_cq *icq) -+{ -+ struct bfq_io_cq *bic = icq_to_bic(icq); -+ -+ bic->ttime.last_end_request = jiffies; -+ /* -+ * A newly created bic indicates that the process has just -+ * started doing I/O, and is probably mapping into memory its -+ * executable and libraries: it definitely needs weight raising. -+ * There is however the possibility that the process performs, -+ * for a while, I/O close to some other process. EQM intercepts -+ * this behavior and may merge the queue corresponding to the -+ * process with some other queue, BEFORE the weight of the queue -+ * is raised. Merged queues are not weight-raised (they are assumed -+ * to belong to processes that benefit only from high throughput). -+ * If the merge is basically the consequence of an accident, then -+ * the queue will be split soon and will get back its old weight. -+ * It is then important to write down somewhere that this queue -+ * does need weight raising, even if it did not make it to get its -+ * weight raised before being merged. To this purpose, we overload -+ * the field raising_time_left and assign 1 to it, to mark the queue -+ * as needing weight raising. -+ */ -+ bic->wr_time_left = 1; -+} -+ -+static void bfq_exit_icq(struct io_cq *icq) -+{ -+ struct bfq_io_cq *bic = icq_to_bic(icq); -+ struct bfq_data *bfqd = bic_to_bfqd(bic); -+ -+ if (bic->bfqq[BLK_RW_ASYNC]) { -+ bfq_exit_bfqq(bfqd, bic->bfqq[BLK_RW_ASYNC]); -+ bic->bfqq[BLK_RW_ASYNC] = NULL; -+ } -+ -+ if (bic->bfqq[BLK_RW_SYNC]) { -+ /* -+ * If the bic is using a shared queue, put the reference -+ * taken on the io_context when the bic started using a -+ * shared bfq_queue. -+ */ -+ if (bfq_bfqq_coop(bic->bfqq[BLK_RW_SYNC])) -+ put_io_context(icq->ioc); -+ bfq_exit_bfqq(bfqd, bic->bfqq[BLK_RW_SYNC]); -+ bic->bfqq[BLK_RW_SYNC] = NULL; -+ } -+} -+ -+/* -+ * Update the entity prio values; note that the new values will not -+ * be used until the next (re)activation. -+ */ -+static void bfq_init_prio_data(struct bfq_queue *bfqq, struct bfq_io_cq *bic) -+{ -+ struct task_struct *tsk = current; -+ int ioprio_class; -+ -+ if (!bfq_bfqq_prio_changed(bfqq)) -+ return; -+ -+ ioprio_class = IOPRIO_PRIO_CLASS(bic->ioprio); -+ switch (ioprio_class) { -+ default: -+ dev_err(bfqq->bfqd->queue->backing_dev_info.dev, -+ "bfq: bad prio class %d\n", ioprio_class); -+ case IOPRIO_CLASS_NONE: -+ /* -+ * No prio set, inherit CPU scheduling settings. 
-+ */ -+ bfqq->entity.new_ioprio = task_nice_ioprio(tsk); -+ bfqq->entity.new_ioprio_class = task_nice_ioclass(tsk); -+ break; -+ case IOPRIO_CLASS_RT: -+ bfqq->entity.new_ioprio = IOPRIO_PRIO_DATA(bic->ioprio); -+ bfqq->entity.new_ioprio_class = IOPRIO_CLASS_RT; -+ break; -+ case IOPRIO_CLASS_BE: -+ bfqq->entity.new_ioprio = IOPRIO_PRIO_DATA(bic->ioprio); -+ bfqq->entity.new_ioprio_class = IOPRIO_CLASS_BE; -+ break; -+ case IOPRIO_CLASS_IDLE: -+ bfqq->entity.new_ioprio_class = IOPRIO_CLASS_IDLE; -+ bfqq->entity.new_ioprio = 7; -+ bfq_clear_bfqq_idle_window(bfqq); -+ break; -+ } -+ -+ if (bfqq->entity.new_ioprio < 0 || -+ bfqq->entity.new_ioprio >= IOPRIO_BE_NR) { -+ printk(KERN_CRIT "bfq_init_prio_data: new_ioprio %d\n", -+ bfqq->entity.new_ioprio); -+ BUG(); -+ } -+ -+ bfqq->entity.ioprio_changed = 1; -+ -+ bfq_clear_bfqq_prio_changed(bfqq); -+} -+ -+static void bfq_changed_ioprio(struct bfq_io_cq *bic) -+{ -+ struct bfq_data *bfqd; -+ struct bfq_queue *bfqq, *new_bfqq; -+ struct bfq_group *bfqg; -+ unsigned long uninitialized_var(flags); -+ int ioprio = bic->icq.ioc->ioprio; -+ -+ bfqd = bfq_get_bfqd_locked(&(bic->icq.q->elevator->elevator_data), -+ &flags); -+ /* -+ * This condition may trigger on a newly created bic, be sure to -+ * drop the lock before returning. -+ */ -+ if (unlikely(bfqd == NULL) || likely(bic->ioprio == ioprio)) -+ goto out; -+ -+ bfqq = bic->bfqq[BLK_RW_ASYNC]; -+ if (bfqq != NULL) { -+ bfqg = container_of(bfqq->entity.sched_data, struct bfq_group, -+ sched_data); -+ new_bfqq = bfq_get_queue(bfqd, bfqg, BLK_RW_ASYNC, bic, -+ GFP_ATOMIC); -+ if (new_bfqq != NULL) { -+ bic->bfqq[BLK_RW_ASYNC] = new_bfqq; -+ bfq_log_bfqq(bfqd, bfqq, -+ "changed_ioprio: bfqq %p %d", -+ bfqq, atomic_read(&bfqq->ref)); -+ bfq_put_queue(bfqq); -+ } -+ } -+ -+ bfqq = bic->bfqq[BLK_RW_SYNC]; -+ if (bfqq != NULL) -+ bfq_mark_bfqq_prio_changed(bfqq); -+ -+ bic->ioprio = ioprio; -+ -+out: -+ bfq_put_bfqd_unlock(bfqd, &flags); -+} -+ -+static void bfq_init_bfqq(struct bfq_data *bfqd, struct bfq_queue *bfqq, -+ pid_t pid, int is_sync) -+{ -+ RB_CLEAR_NODE(&bfqq->entity.rb_node); -+ INIT_LIST_HEAD(&bfqq->fifo); -+ INIT_HLIST_NODE(&bfqq->burst_list_node); -+ -+ atomic_set(&bfqq->ref, 0); -+ bfqq->bfqd = bfqd; -+ -+ bfq_mark_bfqq_prio_changed(bfqq); -+ -+ if (is_sync) { -+ if (!bfq_class_idle(bfqq)) -+ bfq_mark_bfqq_idle_window(bfqq); -+ bfq_mark_bfqq_sync(bfqq); -+ } -+ bfq_mark_bfqq_IO_bound(bfqq); -+ -+ /* Tentative initial value to trade off between thr and lat */ -+ bfqq->max_budget = (2 * bfq_max_budget(bfqd)) / 3; -+ bfqq->pid = pid; -+ -+ bfqq->wr_coeff = 1; -+ bfqq->last_wr_start_finish = 0; -+ /* -+ * Set to the value for which bfqq will not be deemed as -+ * soft rt when it becomes backlogged. -+ */ -+ bfqq->soft_rt_next_start = bfq_infinity_from_now(jiffies); -+} -+ -+static struct bfq_queue *bfq_find_alloc_queue(struct bfq_data *bfqd, -+ struct bfq_group *bfqg, -+ int is_sync, -+ struct bfq_io_cq *bic, -+ gfp_t gfp_mask) -+{ -+ struct bfq_queue *bfqq, *new_bfqq = NULL; -+ -+retry: -+ /* bic always exists here */ -+ bfqq = bic_to_bfqq(bic, is_sync); -+ -+ /* -+ * Always try a new alloc if we fall back to the OOM bfqq -+ * originally, since it should just be a temporary situation. 
-+ */ -+ if (bfqq == NULL || bfqq == &bfqd->oom_bfqq) { -+ bfqq = NULL; -+ if (new_bfqq != NULL) { -+ bfqq = new_bfqq; -+ new_bfqq = NULL; -+ } else if (gfp_mask & __GFP_WAIT) { -+ spin_unlock_irq(bfqd->queue->queue_lock); -+ new_bfqq = kmem_cache_alloc_node(bfq_pool, -+ gfp_mask | __GFP_ZERO, -+ bfqd->queue->node); -+ spin_lock_irq(bfqd->queue->queue_lock); -+ if (new_bfqq != NULL) -+ goto retry; -+ } else { -+ bfqq = kmem_cache_alloc_node(bfq_pool, -+ gfp_mask | __GFP_ZERO, -+ bfqd->queue->node); -+ } -+ -+ if (bfqq != NULL) { -+ bfq_init_bfqq(bfqd, bfqq, current->pid, is_sync); -+ bfq_init_prio_data(bfqq, bic); -+ bfq_init_entity(&bfqq->entity, bfqg); -+ bfq_log_bfqq(bfqd, bfqq, "allocated"); -+ } else { -+ bfqq = &bfqd->oom_bfqq; -+ bfq_log_bfqq(bfqd, bfqq, "using oom bfqq"); -+ } -+ } -+ -+ if (new_bfqq != NULL) -+ kmem_cache_free(bfq_pool, new_bfqq); -+ -+ return bfqq; -+} -+ -+static struct bfq_queue **bfq_async_queue_prio(struct bfq_data *bfqd, -+ struct bfq_group *bfqg, -+ int ioprio_class, int ioprio) -+{ -+ switch (ioprio_class) { -+ case IOPRIO_CLASS_RT: -+ return &bfqg->async_bfqq[0][ioprio]; -+ case IOPRIO_CLASS_NONE: -+ ioprio = IOPRIO_NORM; -+ /* fall through */ -+ case IOPRIO_CLASS_BE: -+ return &bfqg->async_bfqq[1][ioprio]; -+ case IOPRIO_CLASS_IDLE: -+ return &bfqg->async_idle_bfqq; -+ default: -+ BUG(); -+ } -+} -+ -+static struct bfq_queue *bfq_get_queue(struct bfq_data *bfqd, -+ struct bfq_group *bfqg, int is_sync, -+ struct bfq_io_cq *bic, gfp_t gfp_mask) -+{ -+ const int ioprio = IOPRIO_PRIO_DATA(bic->ioprio); -+ const int ioprio_class = IOPRIO_PRIO_CLASS(bic->ioprio); -+ struct bfq_queue **async_bfqq = NULL; -+ struct bfq_queue *bfqq = NULL; -+ -+ if (!is_sync) { -+ async_bfqq = bfq_async_queue_prio(bfqd, bfqg, ioprio_class, -+ ioprio); -+ bfqq = *async_bfqq; -+ } -+ -+ if (bfqq == NULL) -+ bfqq = bfq_find_alloc_queue(bfqd, bfqg, is_sync, bic, gfp_mask); -+ -+ /* -+ * Pin the queue now that it's allocated, scheduler exit will -+ * prune it. -+ */ -+ if (!is_sync && *async_bfqq == NULL) { -+ atomic_inc(&bfqq->ref); -+ bfq_log_bfqq(bfqd, bfqq, "get_queue, bfqq not in async: %p, %d", -+ bfqq, atomic_read(&bfqq->ref)); -+ *async_bfqq = bfqq; -+ } -+ -+ atomic_inc(&bfqq->ref); -+ bfq_log_bfqq(bfqd, bfqq, "get_queue, at end: %p, %d", bfqq, -+ atomic_read(&bfqq->ref)); -+ return bfqq; -+} -+ -+static void bfq_update_io_thinktime(struct bfq_data *bfqd, -+ struct bfq_io_cq *bic) -+{ -+ unsigned long elapsed = jiffies - bic->ttime.last_end_request; -+ unsigned long ttime = min(elapsed, 2UL * bfqd->bfq_slice_idle); -+ -+ bic->ttime.ttime_samples = (7*bic->ttime.ttime_samples + 256) / 8; -+ bic->ttime.ttime_total = (7*bic->ttime.ttime_total + 256*ttime) / 8; -+ bic->ttime.ttime_mean = (bic->ttime.ttime_total + 128) / -+ bic->ttime.ttime_samples; -+} -+ -+static void bfq_update_io_seektime(struct bfq_data *bfqd, -+ struct bfq_queue *bfqq, -+ struct request *rq) -+{ -+ sector_t sdist; -+ u64 total; -+ -+ if (bfqq->last_request_pos < blk_rq_pos(rq)) -+ sdist = blk_rq_pos(rq) - bfqq->last_request_pos; -+ else -+ sdist = bfqq->last_request_pos - blk_rq_pos(rq); -+ -+ /* -+ * Don't allow the seek distance to get too large from the -+ * odd fragment, pagein, etc. 
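The think-time statistics updated above use a fixed-point exponentially weighted average (7/8 old, 1/8 new, scaled by 256). The following stand-alone sketch reproduces that arithmetic with invented sample values and an assumed 8 ms idle-slice cap.

#include <stdio.h>

/* Fixed-point EWMA as used for per-process think time; values are in
 * milliseconds here only for readability (the kernel works in jiffies). */
struct ttime { unsigned long samples, total, mean; };

static void ttime_update(struct ttime *tt, unsigned long elapsed_ms,
			 unsigned long slice_idle_ms)
{
	unsigned long sample = elapsed_ms < 2 * slice_idle_ms ?
			       elapsed_ms : 2 * slice_idle_ms;

	tt->samples = (7 * tt->samples + 256) / 8;
	tt->total   = (7 * tt->total + 256 * sample) / 8;
	tt->mean    = (tt->total + 128) / tt->samples;
}

int main(void)
{
	struct ttime tt = { 0, 0, 0 };
	unsigned long gaps_ms[] = { 1, 2, 1, 50, 3 };  /* time between requests */
	unsigned int i;

	for (i = 0; i < sizeof(gaps_ms) / sizeof(gaps_ms[0]); i++) {
		ttime_update(&tt, gaps_ms[i], 8);
		printf("after %lu ms gap: mean think time %lu ms\n",
		       gaps_ms[i], tt.mean);
	}
	return 0;
}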
-+ */ -+ if (bfqq->seek_samples == 0) /* first request, not really a seek */ -+ sdist = 0; -+ else if (bfqq->seek_samples <= 60) /* second & third seek */ -+ sdist = min(sdist, (bfqq->seek_mean * 4) + 2*1024*1024); -+ else -+ sdist = min(sdist, (bfqq->seek_mean * 4) + 2*1024*64); -+ -+ bfqq->seek_samples = (7*bfqq->seek_samples + 256) / 8; -+ bfqq->seek_total = (7*bfqq->seek_total + (u64)256*sdist) / 8; -+ total = bfqq->seek_total + (bfqq->seek_samples/2); -+ do_div(total, bfqq->seek_samples); -+ bfqq->seek_mean = (sector_t)total; -+ -+ bfq_log_bfqq(bfqd, bfqq, "dist=%llu mean=%llu", (u64)sdist, -+ (u64)bfqq->seek_mean); -+} -+ -+/* -+ * Disable idle window if the process thinks too long or seeks so much that -+ * it doesn't matter. -+ */ -+static void bfq_update_idle_window(struct bfq_data *bfqd, -+ struct bfq_queue *bfqq, -+ struct bfq_io_cq *bic) -+{ -+ int enable_idle; -+ -+ /* Don't idle for async or idle io prio class. */ -+ if (!bfq_bfqq_sync(bfqq) || bfq_class_idle(bfqq)) -+ return; -+ -+ /* Idle window just restored, statistics are meaningless. */ -+ if (bfq_bfqq_just_split(bfqq)) -+ return; -+ -+ enable_idle = bfq_bfqq_idle_window(bfqq); -+ -+ if (atomic_read(&bic->icq.ioc->active_ref) == 0 || -+ bfqd->bfq_slice_idle == 0 || -+ (bfqd->hw_tag && BFQQ_SEEKY(bfqq) && -+ bfqq->wr_coeff == 1)) -+ enable_idle = 0; -+ else if (bfq_sample_valid(bic->ttime.ttime_samples)) { -+ if (bic->ttime.ttime_mean > bfqd->bfq_slice_idle && -+ bfqq->wr_coeff == 1) -+ enable_idle = 0; -+ else -+ enable_idle = 1; -+ } -+ bfq_log_bfqq(bfqd, bfqq, "update_idle_window: enable_idle %d", -+ enable_idle); -+ -+ if (enable_idle) -+ bfq_mark_bfqq_idle_window(bfqq); -+ else -+ bfq_clear_bfqq_idle_window(bfqq); -+} -+ -+/* -+ * Called when a new fs request (rq) is added to bfqq. Check if there's -+ * something we should do about it. -+ */ -+static void bfq_rq_enqueued(struct bfq_data *bfqd, struct bfq_queue *bfqq, -+ struct request *rq) -+{ -+ struct bfq_io_cq *bic = RQ_BIC(rq); -+ -+ if (rq->cmd_flags & REQ_META) -+ bfqq->meta_pending++; -+ -+ bfq_update_io_thinktime(bfqd, bic); -+ bfq_update_io_seektime(bfqd, bfqq, rq); -+ if (!BFQQ_SEEKY(bfqq) && bfq_bfqq_constantly_seeky(bfqq)) { -+ bfq_clear_bfqq_constantly_seeky(bfqq); -+ if (!blk_queue_nonrot(bfqd->queue)) { -+ BUG_ON(!bfqd->const_seeky_busy_in_flight_queues); -+ bfqd->const_seeky_busy_in_flight_queues--; -+ } -+ } -+ if (bfqq->entity.service > bfq_max_budget(bfqd) / 8 || -+ !BFQQ_SEEKY(bfqq)) -+ bfq_update_idle_window(bfqd, bfqq, bic); -+ bfq_clear_bfqq_just_split(bfqq); -+ -+ bfq_log_bfqq(bfqd, bfqq, -+ "rq_enqueued: idle_window=%d (seeky %d, mean %llu)", -+ bfq_bfqq_idle_window(bfqq), BFQQ_SEEKY(bfqq), -+ (long long unsigned)bfqq->seek_mean); -+ -+ bfqq->last_request_pos = blk_rq_pos(rq) + blk_rq_sectors(rq); -+ -+ if (bfqq == bfqd->in_service_queue && bfq_bfqq_wait_request(bfqq)) { -+ int small_req = bfqq->queued[rq_is_sync(rq)] == 1 && -+ blk_rq_sectors(rq) < 32; -+ int budget_timeout = bfq_bfqq_budget_timeout(bfqq); -+ -+ /* -+ * There is just this request queued: if the request -+ * is small and the queue is not to be expired, then -+ * just exit. -+ * -+ * In this way, if the disk is being idled to wait for -+ * a new request from the in-service queue, we avoid -+ * unplugging the device and committing the disk to serve -+ * just a small request. 
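The idle-window decision just above reduces to a small boolean function; the sketch below restates it with hypothetical stand-ins for the io_context, hw_tag and think-time inputs.

#include <stdbool.h>
#include <stdio.h>

/* Simplified restatement of bfq_update_idle_window(): the idle window is
 * disabled for processes that think too long or seek too much, unless the
 * queue is being weight-raised. */
static bool keep_idle_window(bool currently_enabled, bool ioc_active,
			     unsigned long slice_idle, bool ncq, bool seeky,
			     bool weight_raised, bool ttime_valid,
			     unsigned long ttime_mean)
{
	if (!ioc_active || slice_idle == 0 || (ncq && seeky && !weight_raised))
		return false;
	if (ttime_valid)
		return !(ttime_mean > slice_idle && !weight_raised);
	return currently_enabled;
}

int main(void)
{
	/* a seeky, non-weight-raised process on an NCQ drive loses idling */
	printf("%d\n", keep_idle_window(true, true, 8, true, true,
					false, true, 2));
	/* the same process keeps idling while it is weight-raised */
	printf("%d\n", keep_idle_window(true, true, 8, true, true,
					true, true, 2));
	return 0;
}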
On the contrary, we wait for -+ * the block layer to decide when to unplug the device: -+ * hopefully, new requests will be merged to this one -+ * quickly, then the device will be unplugged and -+ * larger requests will be dispatched. -+ */ -+ if (small_req && !budget_timeout) -+ return; -+ -+ /* -+ * A large enough request arrived, or the queue is to -+ * be expired: in both cases disk idling is to be -+ * stopped, so clear wait_request flag and reset -+ * timer. -+ */ -+ bfq_clear_bfqq_wait_request(bfqq); -+ del_timer(&bfqd->idle_slice_timer); -+ -+ /* -+ * The queue is not empty, because a new request just -+ * arrived. Hence we can safely expire the queue, in -+ * case of budget timeout, without risking that the -+ * timestamps of the queue are not updated correctly. -+ * See [1] for more details. -+ */ -+ if (budget_timeout) -+ bfq_bfqq_expire(bfqd, bfqq, 0, BFQ_BFQQ_BUDGET_TIMEOUT); -+ -+ /* -+ * Let the request rip immediately, or let a new queue be -+ * selected if bfqq has just been expired. -+ */ -+ __blk_run_queue(bfqd->queue); -+ } -+} -+ -+static void bfq_insert_request(struct request_queue *q, struct request *rq) -+{ -+ struct bfq_data *bfqd = q->elevator->elevator_data; -+ struct bfq_queue *bfqq = RQ_BFQQ(rq), *new_bfqq; -+ -+ assert_spin_locked(bfqd->queue->queue_lock); -+ -+ /* -+ * An unplug may trigger a requeue of a request from the device -+ * driver: make sure we are in process context while trying to -+ * merge two bfq_queues. -+ */ -+ if (!in_interrupt()) { -+ new_bfqq = bfq_setup_cooperator(bfqd, bfqq, rq, true); -+ if (new_bfqq != NULL) { -+ if (bic_to_bfqq(RQ_BIC(rq), 1) != bfqq) -+ new_bfqq = bic_to_bfqq(RQ_BIC(rq), 1); -+ /* -+ * Release the request's reference to the old bfqq -+ * and make sure one is taken to the shared queue. -+ */ -+ new_bfqq->allocated[rq_data_dir(rq)]++; -+ bfqq->allocated[rq_data_dir(rq)]--; -+ atomic_inc(&new_bfqq->ref); -+ bfq_put_queue(bfqq); -+ if (bic_to_bfqq(RQ_BIC(rq), 1) == bfqq) -+ bfq_merge_bfqqs(bfqd, RQ_BIC(rq), -+ bfqq, new_bfqq); -+ rq->elv.priv[1] = new_bfqq; -+ bfqq = new_bfqq; -+ } else -+ bfq_bfqq_increase_failed_cooperations(bfqq); -+ } -+ -+ bfq_init_prio_data(bfqq, RQ_BIC(rq)); -+ -+ bfq_add_request(rq); -+ -+ /* -+ * Here a newly-created bfq_queue has already started a weight-raising -+ * period: clear raising_time_left to prevent bfq_bfqq_save_state() -+ * from assigning it a full weight-raising period. See the detailed -+ * comments about this field in bfq_init_icq(). -+ */ -+ if (bfqq->bic != NULL) -+ bfqq->bic->wr_time_left = 0; -+ rq->fifo_time = jiffies + bfqd->bfq_fifo_expire[rq_is_sync(rq)]; -+ list_add_tail(&rq->queuelist, &bfqq->fifo); -+ -+ bfq_rq_enqueued(bfqd, bfqq, rq); -+} -+ -+static void bfq_update_hw_tag(struct bfq_data *bfqd) -+{ -+ bfqd->max_rq_in_driver = max(bfqd->max_rq_in_driver, -+ bfqd->rq_in_driver); -+ -+ if (bfqd->hw_tag == 1) -+ return; -+ -+ /* -+ * This sample is valid if the number of outstanding requests -+ * is large enough to allow a queueing behavior. Note that the -+ * sum is not exact, as it's not taking into account deactivated -+ * requests. 
-+ */ -+ if (bfqd->rq_in_driver + bfqd->queued < BFQ_HW_QUEUE_THRESHOLD) -+ return; -+ -+ if (bfqd->hw_tag_samples++ < BFQ_HW_QUEUE_SAMPLES) -+ return; -+ -+ bfqd->hw_tag = bfqd->max_rq_in_driver > BFQ_HW_QUEUE_THRESHOLD; -+ bfqd->max_rq_in_driver = 0; -+ bfqd->hw_tag_samples = 0; -+} -+ -+static void bfq_completed_request(struct request_queue *q, struct request *rq) -+{ -+ struct bfq_queue *bfqq = RQ_BFQQ(rq); -+ struct bfq_data *bfqd = bfqq->bfqd; -+ bool sync = bfq_bfqq_sync(bfqq); -+ -+ bfq_log_bfqq(bfqd, bfqq, "completed one req with %u sects left (%d)", -+ blk_rq_sectors(rq), sync); -+ -+ bfq_update_hw_tag(bfqd); -+ -+ BUG_ON(!bfqd->rq_in_driver); -+ BUG_ON(!bfqq->dispatched); -+ bfqd->rq_in_driver--; -+ bfqq->dispatched--; -+ -+ if (!bfqq->dispatched && !bfq_bfqq_busy(bfqq)) { -+ bfq_weights_tree_remove(bfqd, &bfqq->entity, -+ &bfqd->queue_weights_tree); -+ if (!blk_queue_nonrot(bfqd->queue)) { -+ BUG_ON(!bfqd->busy_in_flight_queues); -+ bfqd->busy_in_flight_queues--; -+ if (bfq_bfqq_constantly_seeky(bfqq)) { -+ BUG_ON(!bfqd-> -+ const_seeky_busy_in_flight_queues); -+ bfqd->const_seeky_busy_in_flight_queues--; -+ } -+ } -+ } -+ -+ if (sync) { -+ bfqd->sync_flight--; -+ RQ_BIC(rq)->ttime.last_end_request = jiffies; -+ } -+ -+ /* -+ * If we are waiting to discover whether the request pattern of the -+ * task associated with the queue is actually isochronous, and -+ * both requisites for this condition to hold are satisfied, then -+ * compute soft_rt_next_start (see the comments to the function -+ * bfq_bfqq_softrt_next_start()). -+ */ -+ if (bfq_bfqq_softrt_update(bfqq) && bfqq->dispatched == 0 && -+ RB_EMPTY_ROOT(&bfqq->sort_list)) -+ bfqq->soft_rt_next_start = -+ bfq_bfqq_softrt_next_start(bfqd, bfqq); -+ -+ /* -+ * If this is the in-service queue, check if it needs to be expired, -+ * or if we want to idle in case it has no pending requests. -+ */ -+ if (bfqd->in_service_queue == bfqq) { -+ if (bfq_bfqq_budget_new(bfqq)) -+ bfq_set_budget_timeout(bfqd); -+ -+ if (bfq_bfqq_must_idle(bfqq)) { -+ bfq_arm_slice_timer(bfqd); -+ goto out; -+ } else if (bfq_may_expire_for_budg_timeout(bfqq)) -+ bfq_bfqq_expire(bfqd, bfqq, 0, BFQ_BFQQ_BUDGET_TIMEOUT); -+ else if (RB_EMPTY_ROOT(&bfqq->sort_list) && -+ (bfqq->dispatched == 0 || -+ !bfq_bfqq_must_not_expire(bfqq))) -+ bfq_bfqq_expire(bfqd, bfqq, 0, -+ BFQ_BFQQ_NO_MORE_REQUESTS); -+ } -+ -+ if (!bfqd->rq_in_driver) -+ bfq_schedule_dispatch(bfqd); -+ -+out: -+ return; -+} -+ -+static inline int __bfq_may_queue(struct bfq_queue *bfqq) -+{ -+ if (bfq_bfqq_wait_request(bfqq) && bfq_bfqq_must_alloc(bfqq)) { -+ bfq_clear_bfqq_must_alloc(bfqq); -+ return ELV_MQUEUE_MUST; -+ } -+ -+ return ELV_MQUEUE_MAY; -+} -+ -+static int bfq_may_queue(struct request_queue *q, int rw) -+{ -+ struct bfq_data *bfqd = q->elevator->elevator_data; -+ struct task_struct *tsk = current; -+ struct bfq_io_cq *bic; -+ struct bfq_queue *bfqq; -+ -+ /* -+ * Don't force setup of a queue from here, as a call to may_queue -+ * does not necessarily imply that a request actually will be -+ * queued. So just lookup a possibly existing queue, or return -+ * 'may queue' if that fails. -+ */ -+ bic = bfq_bic_lookup(bfqd, tsk->io_context); -+ if (bic == NULL) -+ return ELV_MQUEUE_MAY; -+ -+ bfqq = bic_to_bfqq(bic, rw_is_sync(rw)); -+ if (bfqq != NULL) { -+ bfq_init_prio_data(bfqq, bic); -+ -+ return __bfq_may_queue(bfqq); -+ } -+ -+ return ELV_MQUEUE_MAY; -+} -+ -+/* -+ * Queue lock held here. 
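The NCQ detection heuristic in bfq_update_hw_tag() can be exercised stand-alone: watch the maximum number of in-flight requests over enough valid samples and flag the device as queueing internally once it exceeds the threshold. The threshold and sample count below mirror the idea, not necessarily the exact kernel constants.

#include <stdio.h>

#define HW_QUEUE_THRESHOLD 4
#define HW_QUEUE_SAMPLES   32

struct hw_tag_state { int samples, max_in_driver, hw_tag; };

static void update_hw_tag(struct hw_tag_state *st, int rq_in_driver, int queued)
{
	if (st->max_in_driver < rq_in_driver)
		st->max_in_driver = rq_in_driver;
	if (st->hw_tag == 1)
		return;
	if (rq_in_driver + queued < HW_QUEUE_THRESHOLD)
		return;                  /* not enough load for a valid sample */
	if (st->samples++ < HW_QUEUE_SAMPLES)
		return;
	st->hw_tag = st->max_in_driver > HW_QUEUE_THRESHOLD;
}

int main(void)
{
	struct hw_tag_state st = { 0, 0, -1 };
	int i;

	for (i = 0; i < 40; i++)
		update_hw_tag(&st, 8, 2);      /* sustained deep queue */
	printf("hw_tag = %d\n", st.hw_tag);    /* 1: device treated as NCQ */
	return 0;
}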
-+ */ -+static void bfq_put_request(struct request *rq) -+{ -+ struct bfq_queue *bfqq = RQ_BFQQ(rq); -+ -+ if (bfqq != NULL) { -+ const int rw = rq_data_dir(rq); -+ -+ BUG_ON(!bfqq->allocated[rw]); -+ bfqq->allocated[rw]--; -+ -+ rq->elv.priv[0] = NULL; -+ rq->elv.priv[1] = NULL; -+ -+ bfq_log_bfqq(bfqq->bfqd, bfqq, "put_request %p, %d", -+ bfqq, atomic_read(&bfqq->ref)); -+ bfq_put_queue(bfqq); -+ } -+} -+ -+/* -+ * Returns NULL if a new bfqq should be allocated, or the old bfqq if this -+ * was the last process referring to said bfqq. -+ */ -+static struct bfq_queue * -+bfq_split_bfqq(struct bfq_io_cq *bic, struct bfq_queue *bfqq) -+{ -+ bfq_log_bfqq(bfqq->bfqd, bfqq, "splitting queue"); -+ -+ put_io_context(bic->icq.ioc); -+ -+ if (bfqq_process_refs(bfqq) == 1) { -+ bfqq->pid = current->pid; -+ bfq_clear_bfqq_coop(bfqq); -+ bfq_clear_bfqq_split_coop(bfqq); -+ return bfqq; -+ } -+ -+ bic_set_bfqq(bic, NULL, 1); -+ -+ bfq_put_cooperator(bfqq); -+ -+ bfq_put_queue(bfqq); -+ return NULL; -+} -+ -+/* -+ * Allocate bfq data structures associated with this request. -+ */ -+static int bfq_set_request(struct request_queue *q, struct request *rq, -+ struct bio *bio, gfp_t gfp_mask) -+{ -+ struct bfq_data *bfqd = q->elevator->elevator_data; -+ struct bfq_io_cq *bic = icq_to_bic(rq->elv.icq); -+ const int rw = rq_data_dir(rq); -+ const int is_sync = rq_is_sync(rq); -+ struct bfq_queue *bfqq; -+ struct bfq_group *bfqg; -+ unsigned long flags; -+ bool split = false; -+ -+ might_sleep_if(gfp_mask & __GFP_WAIT); -+ -+ bfq_changed_ioprio(bic); -+ -+ spin_lock_irqsave(q->queue_lock, flags); -+ -+ if (bic == NULL) -+ goto queue_fail; -+ -+ bfqg = bfq_bic_update_cgroup(bic); -+ -+new_queue: -+ bfqq = bic_to_bfqq(bic, is_sync); -+ if (bfqq == NULL || bfqq == &bfqd->oom_bfqq) { -+ bfqq = bfq_get_queue(bfqd, bfqg, is_sync, bic, gfp_mask); -+ bic_set_bfqq(bic, bfqq, is_sync); -+ if (split && is_sync) { -+ if ((bic->was_in_burst_list && bfqd->large_burst) || -+ bic->saved_in_large_burst) -+ bfq_mark_bfqq_in_large_burst(bfqq); -+ else { -+ bfq_clear_bfqq_in_large_burst(bfqq); -+ if (bic->was_in_burst_list) -+ hlist_add_head(&bfqq->burst_list_node, -+ &bfqd->burst_list); -+ } -+ } -+ } else { -+ /* If the queue was seeky for too long, break it apart. */ -+ if (bfq_bfqq_coop(bfqq) && bfq_bfqq_split_coop(bfqq)) { -+ bfq_log_bfqq(bfqd, bfqq, "breaking apart bfqq"); -+ bfqq = bfq_split_bfqq(bic, bfqq); -+ split = true; -+ if (!bfqq) -+ goto new_queue; -+ } -+ } -+ -+ bfqq->allocated[rw]++; -+ atomic_inc(&bfqq->ref); -+ bfq_log_bfqq(bfqd, bfqq, "set_request: bfqq %p, %d", bfqq, -+ atomic_read(&bfqq->ref)); -+ -+ rq->elv.priv[0] = bic; -+ rq->elv.priv[1] = bfqq; -+ -+ /* -+ * If a bfq_queue has only one process reference, it is owned -+ * by only one bfq_io_cq: we can set the bic field of the -+ * bfq_queue to the address of that structure. Also, if the -+ * queue has just been split, mark a flag so that the -+ * information is available to the other scheduler hooks. -+ */ -+ if (likely(bfqq != &bfqd->oom_bfqq) && bfqq_process_refs(bfqq) == 1) { -+ bfqq->bic = bic; -+ if (split) { -+ bfq_mark_bfqq_just_split(bfqq); -+ /* -+ * If the queue has just been split from a shared -+ * queue, restore the idle window and the possible -+ * weight raising period. 
-+ */ -+ bfq_bfqq_resume_state(bfqq, bic); -+ } -+ } -+ -+ spin_unlock_irqrestore(q->queue_lock, flags); -+ -+ return 0; -+ -+queue_fail: -+ bfq_schedule_dispatch(bfqd); -+ spin_unlock_irqrestore(q->queue_lock, flags); -+ -+ return 1; -+} -+ -+static void bfq_kick_queue(struct work_struct *work) -+{ -+ struct bfq_data *bfqd = -+ container_of(work, struct bfq_data, unplug_work); -+ struct request_queue *q = bfqd->queue; -+ -+ spin_lock_irq(q->queue_lock); -+ __blk_run_queue(q); -+ spin_unlock_irq(q->queue_lock); -+} -+ -+/* -+ * Handler of the expiration of the timer running if the in-service queue -+ * is idling inside its time slice. -+ */ -+static void bfq_idle_slice_timer(unsigned long data) -+{ -+ struct bfq_data *bfqd = (struct bfq_data *)data; -+ struct bfq_queue *bfqq; -+ unsigned long flags; -+ enum bfqq_expiration reason; -+ -+ spin_lock_irqsave(bfqd->queue->queue_lock, flags); -+ -+ bfqq = bfqd->in_service_queue; -+ /* -+ * Theoretical race here: the in-service queue can be NULL or -+ * different from the queue that was idling if the timer handler -+ * spins on the queue_lock and a new request arrives for the -+ * current queue and there is a full dispatch cycle that changes -+ * the in-service queue. This can hardly happen, but in the worst -+ * case we just expire a queue too early. -+ */ -+ if (bfqq != NULL) { -+ bfq_log_bfqq(bfqd, bfqq, "slice_timer expired"); -+ if (bfq_bfqq_budget_timeout(bfqq)) -+ /* -+ * Also here the queue can be safely expired -+ * for budget timeout without wasting -+ * guarantees -+ */ -+ reason = BFQ_BFQQ_BUDGET_TIMEOUT; -+ else if (bfqq->queued[0] == 0 && bfqq->queued[1] == 0) -+ /* -+ * The queue may not be empty upon timer expiration, -+ * because we may not disable the timer when the -+ * first request of the in-service queue arrives -+ * during disk idling. -+ */ -+ reason = BFQ_BFQQ_TOO_IDLE; -+ else -+ goto schedule_dispatch; -+ -+ bfq_bfqq_expire(bfqd, bfqq, 1, reason); -+ } -+ -+schedule_dispatch: -+ bfq_schedule_dispatch(bfqd); -+ -+ spin_unlock_irqrestore(bfqd->queue->queue_lock, flags); -+} -+ -+static void bfq_shutdown_timer_wq(struct bfq_data *bfqd) -+{ -+ del_timer_sync(&bfqd->idle_slice_timer); -+ cancel_work_sync(&bfqd->unplug_work); -+} -+ -+static inline void __bfq_put_async_bfqq(struct bfq_data *bfqd, -+ struct bfq_queue **bfqq_ptr) -+{ -+ struct bfq_group *root_group = bfqd->root_group; -+ struct bfq_queue *bfqq = *bfqq_ptr; -+ -+ bfq_log(bfqd, "put_async_bfqq: %p", bfqq); -+ if (bfqq != NULL) { -+ bfq_bfqq_move(bfqd, bfqq, &bfqq->entity, root_group); -+ bfq_log_bfqq(bfqd, bfqq, "put_async_bfqq: putting %p, %d", -+ bfqq, atomic_read(&bfqq->ref)); -+ bfq_put_queue(bfqq); -+ *bfqq_ptr = NULL; -+ } -+} -+ -+/* -+ * Release all the bfqg references to its async queues. If we are -+ * deallocating the group these queues may still contain requests, so -+ * we reparent them to the root cgroup (i.e., the only one that will -+ * exist for sure until all the requests on a device are gone). 
-+ */ -+static void bfq_put_async_queues(struct bfq_data *bfqd, struct bfq_group *bfqg) -+{ -+ int i, j; -+ -+ for (i = 0; i < 2; i++) -+ for (j = 0; j < IOPRIO_BE_NR; j++) -+ __bfq_put_async_bfqq(bfqd, &bfqg->async_bfqq[i][j]); -+ -+ __bfq_put_async_bfqq(bfqd, &bfqg->async_idle_bfqq); -+} -+ -+static void bfq_exit_queue(struct elevator_queue *e) -+{ -+ struct bfq_data *bfqd = e->elevator_data; -+ struct request_queue *q = bfqd->queue; -+ struct bfq_queue *bfqq, *n; -+ -+ bfq_shutdown_timer_wq(bfqd); -+ -+ spin_lock_irq(q->queue_lock); -+ -+ BUG_ON(bfqd->in_service_queue != NULL); -+ list_for_each_entry_safe(bfqq, n, &bfqd->idle_list, bfqq_list) -+ bfq_deactivate_bfqq(bfqd, bfqq, 0); -+ -+ bfq_disconnect_groups(bfqd); -+ spin_unlock_irq(q->queue_lock); -+ -+ bfq_shutdown_timer_wq(bfqd); -+ -+ synchronize_rcu(); -+ -+ BUG_ON(timer_pending(&bfqd->idle_slice_timer)); -+ -+ bfq_free_root_group(bfqd); -+ kfree(bfqd); -+} -+ -+static int bfq_init_queue(struct request_queue *q, struct elevator_type *e) -+{ -+ struct bfq_group *bfqg; -+ struct bfq_data *bfqd; -+ struct elevator_queue *eq; -+ -+ eq = elevator_alloc(q, e); -+ if (eq == NULL) -+ return -ENOMEM; -+ -+ bfqd = kzalloc_node(sizeof(*bfqd), GFP_KERNEL, q->node); -+ if (bfqd == NULL) { -+ kobject_put(&eq->kobj); -+ return -ENOMEM; -+ } -+ eq->elevator_data = bfqd; -+ -+ /* -+ * Our fallback bfqq if bfq_find_alloc_queue() runs into OOM issues. -+ * Grab a permanent reference to it, so that the normal code flow -+ * will not attempt to free it. -+ */ -+ bfq_init_bfqq(bfqd, &bfqd->oom_bfqq, 1, 0); -+ atomic_inc(&bfqd->oom_bfqq.ref); -+ bfqd->oom_bfqq.entity.new_ioprio = BFQ_DEFAULT_QUEUE_IOPRIO; -+ bfqd->oom_bfqq.entity.new_ioprio_class = IOPRIO_CLASS_BE; -+ /* -+ * Trigger weight initialization, according to ioprio, at the -+ * oom_bfqq's first activation. The oom_bfqq's ioprio and ioprio -+ * class won't be changed any more. 
-+ */ -+ bfqd->oom_bfqq.entity.ioprio_changed = 1; -+ -+ bfqd->queue = q; -+ -+ spin_lock_irq(q->queue_lock); -+ q->elevator = eq; -+ spin_unlock_irq(q->queue_lock); -+ -+ bfqg = bfq_alloc_root_group(bfqd, q->node); -+ if (bfqg == NULL) { -+ kfree(bfqd); -+ kobject_put(&eq->kobj); -+ return -ENOMEM; -+ } -+ -+ bfqd->root_group = bfqg; -+ bfq_init_entity(&bfqd->oom_bfqq.entity, bfqd->root_group); -+#ifdef CONFIG_CGROUP_BFQIO -+ bfqd->active_numerous_groups = 0; -+#endif -+ -+ init_timer(&bfqd->idle_slice_timer); -+ bfqd->idle_slice_timer.function = bfq_idle_slice_timer; -+ bfqd->idle_slice_timer.data = (unsigned long)bfqd; -+ -+ bfqd->rq_pos_tree = RB_ROOT; -+ bfqd->queue_weights_tree = RB_ROOT; -+ bfqd->group_weights_tree = RB_ROOT; -+ -+ INIT_WORK(&bfqd->unplug_work, bfq_kick_queue); -+ -+ INIT_LIST_HEAD(&bfqd->active_list); -+ INIT_LIST_HEAD(&bfqd->idle_list); -+ INIT_HLIST_HEAD(&bfqd->burst_list); -+ -+ bfqd->hw_tag = -1; -+ -+ bfqd->bfq_max_budget = bfq_default_max_budget; -+ -+ bfqd->bfq_quantum = bfq_quantum; -+ bfqd->bfq_fifo_expire[0] = bfq_fifo_expire[0]; -+ bfqd->bfq_fifo_expire[1] = bfq_fifo_expire[1]; -+ bfqd->bfq_back_max = bfq_back_max; -+ bfqd->bfq_back_penalty = bfq_back_penalty; -+ bfqd->bfq_slice_idle = bfq_slice_idle; -+ bfqd->bfq_class_idle_last_service = 0; -+ bfqd->bfq_max_budget_async_rq = bfq_max_budget_async_rq; -+ bfqd->bfq_timeout[BLK_RW_ASYNC] = bfq_timeout_async; -+ bfqd->bfq_timeout[BLK_RW_SYNC] = bfq_timeout_sync; -+ -+ bfqd->bfq_coop_thresh = 2; -+ bfqd->bfq_failed_cooperations = 7000; -+ bfqd->bfq_requests_within_timer = 120; -+ -+ bfqd->bfq_large_burst_thresh = 11; -+ bfqd->bfq_burst_interval = msecs_to_jiffies(500); -+ -+ bfqd->low_latency = true; -+ -+ bfqd->bfq_wr_coeff = 20; -+ bfqd->bfq_wr_rt_max_time = msecs_to_jiffies(300); -+ bfqd->bfq_wr_max_time = 0; -+ bfqd->bfq_wr_min_idle_time = msecs_to_jiffies(2000); -+ bfqd->bfq_wr_min_inter_arr_async = msecs_to_jiffies(500); -+ bfqd->bfq_wr_max_softrt_rate = 7000; /* -+ * Approximate rate required -+ * to playback or record a -+ * high-definition compressed -+ * video. -+ */ -+ bfqd->wr_busy_queues = 0; -+ bfqd->busy_in_flight_queues = 0; -+ bfqd->const_seeky_busy_in_flight_queues = 0; -+ -+ /* -+ * Begin by assuming, optimistically, that the device peak rate is -+ * equal to the highest reference rate. -+ */ -+ bfqd->RT_prod = R_fast[blk_queue_nonrot(bfqd->queue)] * -+ T_fast[blk_queue_nonrot(bfqd->queue)]; -+ bfqd->peak_rate = R_fast[blk_queue_nonrot(bfqd->queue)]; -+ bfqd->device_speed = BFQ_BFQD_FAST; -+ -+ return 0; -+} -+ -+static void bfq_slab_kill(void) -+{ -+ if (bfq_pool != NULL) -+ kmem_cache_destroy(bfq_pool); -+} -+ -+static int __init bfq_slab_setup(void) -+{ -+ bfq_pool = KMEM_CACHE(bfq_queue, 0); -+ if (bfq_pool == NULL) -+ return -ENOMEM; -+ return 0; -+} -+ -+static ssize_t bfq_var_show(unsigned int var, char *page) -+{ -+ return sprintf(page, "%d\n", var); -+} -+ -+static ssize_t bfq_var_store(unsigned long *var, const char *page, -+ size_t count) -+{ -+ unsigned long new_val; -+ int ret = kstrtoul(page, 10, &new_val); -+ -+ if (ret == 0) -+ *var = new_val; -+ -+ return count; -+} -+ -+static ssize_t bfq_wr_max_time_show(struct elevator_queue *e, char *page) -+{ -+ struct bfq_data *bfqd = e->elevator_data; -+ return sprintf(page, "%d\n", bfqd->bfq_wr_max_time > 0 ? 
-+ jiffies_to_msecs(bfqd->bfq_wr_max_time) : -+ jiffies_to_msecs(bfq_wr_duration(bfqd))); -+} -+ -+static ssize_t bfq_weights_show(struct elevator_queue *e, char *page) -+{ -+ struct bfq_queue *bfqq; -+ struct bfq_data *bfqd = e->elevator_data; -+ ssize_t num_char = 0; -+ -+ num_char += sprintf(page + num_char, "Tot reqs queued %d\n\n", -+ bfqd->queued); -+ -+ spin_lock_irq(bfqd->queue->queue_lock); -+ -+ num_char += sprintf(page + num_char, "Active:\n"); -+ list_for_each_entry(bfqq, &bfqd->active_list, bfqq_list) { -+ num_char += sprintf(page + num_char, -+ "pid%d: weight %hu, nr_queued %d %d, dur %d/%u\n", -+ bfqq->pid, -+ bfqq->entity.weight, -+ bfqq->queued[0], -+ bfqq->queued[1], -+ jiffies_to_msecs(jiffies - bfqq->last_wr_start_finish), -+ jiffies_to_msecs(bfqq->wr_cur_max_time)); -+ } -+ -+ num_char += sprintf(page + num_char, "Idle:\n"); -+ list_for_each_entry(bfqq, &bfqd->idle_list, bfqq_list) { -+ num_char += sprintf(page + num_char, -+ "pid%d: weight %hu, dur %d/%u\n", -+ bfqq->pid, -+ bfqq->entity.weight, -+ jiffies_to_msecs(jiffies - -+ bfqq->last_wr_start_finish), -+ jiffies_to_msecs(bfqq->wr_cur_max_time)); -+ } -+ -+ spin_unlock_irq(bfqd->queue->queue_lock); -+ -+ return num_char; -+} -+ -+#define SHOW_FUNCTION(__FUNC, __VAR, __CONV) \ -+static ssize_t __FUNC(struct elevator_queue *e, char *page) \ -+{ \ -+ struct bfq_data *bfqd = e->elevator_data; \ -+ unsigned int __data = __VAR; \ -+ if (__CONV) \ -+ __data = jiffies_to_msecs(__data); \ -+ return bfq_var_show(__data, (page)); \ -+} -+SHOW_FUNCTION(bfq_quantum_show, bfqd->bfq_quantum, 0); -+SHOW_FUNCTION(bfq_fifo_expire_sync_show, bfqd->bfq_fifo_expire[1], 1); -+SHOW_FUNCTION(bfq_fifo_expire_async_show, bfqd->bfq_fifo_expire[0], 1); -+SHOW_FUNCTION(bfq_back_seek_max_show, bfqd->bfq_back_max, 0); -+SHOW_FUNCTION(bfq_back_seek_penalty_show, bfqd->bfq_back_penalty, 0); -+SHOW_FUNCTION(bfq_slice_idle_show, bfqd->bfq_slice_idle, 1); -+SHOW_FUNCTION(bfq_max_budget_show, bfqd->bfq_user_max_budget, 0); -+SHOW_FUNCTION(bfq_max_budget_async_rq_show, -+ bfqd->bfq_max_budget_async_rq, 0); -+SHOW_FUNCTION(bfq_timeout_sync_show, bfqd->bfq_timeout[BLK_RW_SYNC], 1); -+SHOW_FUNCTION(bfq_timeout_async_show, bfqd->bfq_timeout[BLK_RW_ASYNC], 1); -+SHOW_FUNCTION(bfq_low_latency_show, bfqd->low_latency, 0); -+SHOW_FUNCTION(bfq_wr_coeff_show, bfqd->bfq_wr_coeff, 0); -+SHOW_FUNCTION(bfq_wr_rt_max_time_show, bfqd->bfq_wr_rt_max_time, 1); -+SHOW_FUNCTION(bfq_wr_min_idle_time_show, bfqd->bfq_wr_min_idle_time, 1); -+SHOW_FUNCTION(bfq_wr_min_inter_arr_async_show, bfqd->bfq_wr_min_inter_arr_async, -+ 1); -+SHOW_FUNCTION(bfq_wr_max_softrt_rate_show, bfqd->bfq_wr_max_softrt_rate, 0); -+#undef SHOW_FUNCTION -+ -+#define STORE_FUNCTION(__FUNC, __PTR, MIN, MAX, __CONV) \ -+static ssize_t \ -+__FUNC(struct elevator_queue *e, const char *page, size_t count) \ -+{ \ -+ struct bfq_data *bfqd = e->elevator_data; \ -+ unsigned long uninitialized_var(__data); \ -+ int ret = bfq_var_store(&__data, (page), count); \ -+ if (__data < (MIN)) \ -+ __data = (MIN); \ -+ else if (__data > (MAX)) \ -+ __data = (MAX); \ -+ if (__CONV) \ -+ *(__PTR) = msecs_to_jiffies(__data); \ -+ else \ -+ *(__PTR) = __data; \ -+ return ret; \ -+} -+STORE_FUNCTION(bfq_quantum_store, &bfqd->bfq_quantum, 1, INT_MAX, 0); -+STORE_FUNCTION(bfq_fifo_expire_sync_store, &bfqd->bfq_fifo_expire[1], 1, -+ INT_MAX, 1); -+STORE_FUNCTION(bfq_fifo_expire_async_store, &bfqd->bfq_fifo_expire[0], 1, -+ INT_MAX, 1); -+STORE_FUNCTION(bfq_back_seek_max_store, &bfqd->bfq_back_max, 0, INT_MAX, 0); 
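The SHOW_FUNCTION/STORE_FUNCTION pairs above stamp out one parse-and-clamp handler per tunable. A userspace analogue of the store side, with example tunables and bounds, looks like this:

#include <limits.h>
#include <stdio.h>
#include <stdlib.h>

/* One macro generates a parse-and-clamp setter per tunable, so the sysfs
 * boilerplate is written only once. The tunables and bounds are examples. */
static unsigned long quantum = 4;
static unsigned long back_seek_max = 16384;

#define DEFINE_STORE(name, ptr, min, max)			\
static void name##_store(const char *page)			\
{								\
	unsigned long v = strtoul(page, NULL, 10);		\
	if (v < (min))						\
		v = (min);					\
	else if (v > (max))					\
		v = (max);					\
	*(ptr) = v;						\
}

DEFINE_STORE(quantum, &quantum, 1, INT_MAX)
DEFINE_STORE(back_seek_max, &back_seek_max, 0, INT_MAX)

int main(void)
{
	quantum_store("0");                    /* clamped up to the minimum */
	back_seek_max_store("99999999999");    /* clamped down to INT_MAX   */
	printf("quantum=%lu back_seek_max=%lu\n", quantum, back_seek_max);
	return 0;
}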
-+STORE_FUNCTION(bfq_back_seek_penalty_store, &bfqd->bfq_back_penalty, 1, -+ INT_MAX, 0); -+STORE_FUNCTION(bfq_slice_idle_store, &bfqd->bfq_slice_idle, 0, INT_MAX, 1); -+STORE_FUNCTION(bfq_max_budget_async_rq_store, &bfqd->bfq_max_budget_async_rq, -+ 1, INT_MAX, 0); -+STORE_FUNCTION(bfq_timeout_async_store, &bfqd->bfq_timeout[BLK_RW_ASYNC], 0, -+ INT_MAX, 1); -+STORE_FUNCTION(bfq_wr_coeff_store, &bfqd->bfq_wr_coeff, 1, INT_MAX, 0); -+STORE_FUNCTION(bfq_wr_max_time_store, &bfqd->bfq_wr_max_time, 0, INT_MAX, 1); -+STORE_FUNCTION(bfq_wr_rt_max_time_store, &bfqd->bfq_wr_rt_max_time, 0, INT_MAX, -+ 1); -+STORE_FUNCTION(bfq_wr_min_idle_time_store, &bfqd->bfq_wr_min_idle_time, 0, -+ INT_MAX, 1); -+STORE_FUNCTION(bfq_wr_min_inter_arr_async_store, -+ &bfqd->bfq_wr_min_inter_arr_async, 0, INT_MAX, 1); -+STORE_FUNCTION(bfq_wr_max_softrt_rate_store, &bfqd->bfq_wr_max_softrt_rate, 0, -+ INT_MAX, 0); -+#undef STORE_FUNCTION -+ -+/* do nothing for the moment */ -+static ssize_t bfq_weights_store(struct elevator_queue *e, -+ const char *page, size_t count) -+{ -+ return count; -+} -+ -+static inline unsigned long bfq_estimated_max_budget(struct bfq_data *bfqd) -+{ -+ u64 timeout = jiffies_to_msecs(bfqd->bfq_timeout[BLK_RW_SYNC]); -+ -+ if (bfqd->peak_rate_samples >= BFQ_PEAK_RATE_SAMPLES) -+ return bfq_calc_max_budget(bfqd->peak_rate, timeout); -+ else -+ return bfq_default_max_budget; -+} -+ -+static ssize_t bfq_max_budget_store(struct elevator_queue *e, -+ const char *page, size_t count) -+{ -+ struct bfq_data *bfqd = e->elevator_data; -+ unsigned long uninitialized_var(__data); -+ int ret = bfq_var_store(&__data, (page), count); -+ -+ if (__data == 0) -+ bfqd->bfq_max_budget = bfq_estimated_max_budget(bfqd); -+ else { -+ if (__data > INT_MAX) -+ __data = INT_MAX; -+ bfqd->bfq_max_budget = __data; -+ } -+ -+ bfqd->bfq_user_max_budget = __data; -+ -+ return ret; -+} -+ -+static ssize_t bfq_timeout_sync_store(struct elevator_queue *e, -+ const char *page, size_t count) -+{ -+ struct bfq_data *bfqd = e->elevator_data; -+ unsigned long uninitialized_var(__data); -+ int ret = bfq_var_store(&__data, (page), count); -+ -+ if (__data < 1) -+ __data = 1; -+ else if (__data > INT_MAX) -+ __data = INT_MAX; -+ -+ bfqd->bfq_timeout[BLK_RW_SYNC] = msecs_to_jiffies(__data); -+ if (bfqd->bfq_user_max_budget == 0) -+ bfqd->bfq_max_budget = bfq_estimated_max_budget(bfqd); -+ -+ return ret; -+} -+ -+static ssize_t bfq_low_latency_store(struct elevator_queue *e, -+ const char *page, size_t count) -+{ -+ struct bfq_data *bfqd = e->elevator_data; -+ unsigned long uninitialized_var(__data); -+ int ret = bfq_var_store(&__data, (page), count); -+ -+ if (__data > 1) -+ __data = 1; -+ if (__data == 0 && bfqd->low_latency != 0) -+ bfq_end_wr(bfqd); -+ bfqd->low_latency = __data; -+ -+ return ret; -+} -+ -+#define BFQ_ATTR(name) \ -+ __ATTR(name, S_IRUGO|S_IWUSR, bfq_##name##_show, bfq_##name##_store) -+ -+static struct elv_fs_entry bfq_attrs[] = { -+ BFQ_ATTR(quantum), -+ BFQ_ATTR(fifo_expire_sync), -+ BFQ_ATTR(fifo_expire_async), -+ BFQ_ATTR(back_seek_max), -+ BFQ_ATTR(back_seek_penalty), -+ BFQ_ATTR(slice_idle), -+ BFQ_ATTR(max_budget), -+ BFQ_ATTR(max_budget_async_rq), -+ BFQ_ATTR(timeout_sync), -+ BFQ_ATTR(timeout_async), -+ BFQ_ATTR(low_latency), -+ BFQ_ATTR(wr_coeff), -+ BFQ_ATTR(wr_max_time), -+ BFQ_ATTR(wr_rt_max_time), -+ BFQ_ATTR(wr_min_idle_time), -+ BFQ_ATTR(wr_min_inter_arr_async), -+ BFQ_ATTR(wr_max_softrt_rate), -+ BFQ_ATTR(weights), -+ __ATTR_NULL -+}; -+ -+static struct elevator_type iosched_bfq = { -+ .ops = { -+ 
.elevator_merge_fn = bfq_merge, -+ .elevator_merged_fn = bfq_merged_request, -+ .elevator_merge_req_fn = bfq_merged_requests, -+ .elevator_allow_merge_fn = bfq_allow_merge, -+ .elevator_dispatch_fn = bfq_dispatch_requests, -+ .elevator_add_req_fn = bfq_insert_request, -+ .elevator_activate_req_fn = bfq_activate_request, -+ .elevator_deactivate_req_fn = bfq_deactivate_request, -+ .elevator_completed_req_fn = bfq_completed_request, -+ .elevator_former_req_fn = elv_rb_former_request, -+ .elevator_latter_req_fn = elv_rb_latter_request, -+ .elevator_init_icq_fn = bfq_init_icq, -+ .elevator_exit_icq_fn = bfq_exit_icq, -+ .elevator_set_req_fn = bfq_set_request, -+ .elevator_put_req_fn = bfq_put_request, -+ .elevator_may_queue_fn = bfq_may_queue, -+ .elevator_init_fn = bfq_init_queue, -+ .elevator_exit_fn = bfq_exit_queue, -+ }, -+ .icq_size = sizeof(struct bfq_io_cq), -+ .icq_align = __alignof__(struct bfq_io_cq), -+ .elevator_attrs = bfq_attrs, -+ .elevator_name = "bfq", -+ .elevator_owner = THIS_MODULE, -+}; -+ -+static int __init bfq_init(void) -+{ -+ /* -+ * Can be 0 on HZ < 1000 setups. -+ */ -+ if (bfq_slice_idle == 0) -+ bfq_slice_idle = 1; -+ -+ if (bfq_timeout_async == 0) -+ bfq_timeout_async = 1; -+ -+ if (bfq_slab_setup()) -+ return -ENOMEM; -+ -+ /* -+ * Times to load large popular applications for the typical systems -+ * installed on the reference devices (see the comments before the -+ * definitions of the two arrays). -+ */ -+ T_slow[0] = msecs_to_jiffies(2600); -+ T_slow[1] = msecs_to_jiffies(1000); -+ T_fast[0] = msecs_to_jiffies(5500); -+ T_fast[1] = msecs_to_jiffies(2000); -+ -+ /* -+ * Thresholds that determine the switch between speed classes (see -+ * the comments before the definition of the array). -+ */ -+ device_speed_thresh[0] = (R_fast[0] + R_slow[0]) / 2; -+ device_speed_thresh[1] = (R_fast[1] + R_slow[1]) / 2; -+ -+ elv_register(&iosched_bfq); -+ pr_info("BFQ I/O-scheduler version: v7r7"); -+ -+ return 0; -+} -+ -+static void __exit bfq_exit(void) -+{ -+ elv_unregister(&iosched_bfq); -+ bfq_slab_kill(); -+} -+ -+module_init(bfq_init); -+module_exit(bfq_exit); -+ -+MODULE_AUTHOR("Fabio Checconi, Paolo Valente"); -+MODULE_LICENSE("GPL"); -diff -Nur linux-4.1.3/block/bfq-sched.c linux-xbian-imx6/block/bfq-sched.c ---- linux-4.1.3/block/bfq-sched.c 1970-01-01 01:00:00.000000000 +0100 -+++ linux-xbian-imx6/block/bfq-sched.c 2015-07-27 23:13:03.604123194 +0200 -@@ -0,0 +1,1186 @@ -+/* -+ * BFQ: Hierarchical B-WF2Q+ scheduler. -+ * -+ * Based on ideas and code from CFQ: -+ * Copyright (C) 2003 Jens Axboe -+ * -+ * Copyright (C) 2008 Fabio Checconi -+ * Paolo Valente -+ * -+ * Copyright (C) 2010 Paolo Valente -+ */ -+ -+#ifdef CONFIG_CGROUP_BFQIO -+#define for_each_entity(entity) \ -+ for (; entity != NULL; entity = entity->parent) -+ -+#define for_each_entity_safe(entity, parent) \ -+ for (; entity && ({ parent = entity->parent; 1; }); entity = parent) -+ -+static struct bfq_entity *bfq_lookup_next_entity(struct bfq_sched_data *sd, -+ int extract, -+ struct bfq_data *bfqd); -+ -+static inline void bfq_update_budget(struct bfq_entity *next_in_service) -+{ -+ struct bfq_entity *bfqg_entity; -+ struct bfq_group *bfqg; -+ struct bfq_sched_data *group_sd; -+ -+ BUG_ON(next_in_service == NULL); -+ -+ group_sd = next_in_service->sched_data; -+ -+ bfqg = container_of(group_sd, struct bfq_group, sched_data); -+ /* -+ * bfq_group's my_entity field is not NULL only if the group -+ * is not the root group. 
We must not touch the root entity -+ * as it must never become an in-service entity. -+ */ -+ bfqg_entity = bfqg->my_entity; -+ if (bfqg_entity != NULL) -+ bfqg_entity->budget = next_in_service->budget; -+} -+ -+static int bfq_update_next_in_service(struct bfq_sched_data *sd) -+{ -+ struct bfq_entity *next_in_service; -+ -+ if (sd->in_service_entity != NULL) -+ /* will update/requeue at the end of service */ -+ return 0; -+ -+ /* -+ * NOTE: this can be improved in many ways, such as returning -+ * 1 (and thus propagating upwards the update) only when the -+ * budget changes, or caching the bfqq that will be scheduled -+ * next from this subtree. By now we worry more about -+ * correctness than about performance... -+ */ -+ next_in_service = bfq_lookup_next_entity(sd, 0, NULL); -+ sd->next_in_service = next_in_service; -+ -+ if (next_in_service != NULL) -+ bfq_update_budget(next_in_service); -+ -+ return 1; -+} -+ -+static inline void bfq_check_next_in_service(struct bfq_sched_data *sd, -+ struct bfq_entity *entity) -+{ -+ BUG_ON(sd->next_in_service != entity); -+} -+#else -+#define for_each_entity(entity) \ -+ for (; entity != NULL; entity = NULL) -+ -+#define for_each_entity_safe(entity, parent) \ -+ for (parent = NULL; entity != NULL; entity = parent) -+ -+static inline int bfq_update_next_in_service(struct bfq_sched_data *sd) -+{ -+ return 0; -+} -+ -+static inline void bfq_check_next_in_service(struct bfq_sched_data *sd, -+ struct bfq_entity *entity) -+{ -+} -+ -+static inline void bfq_update_budget(struct bfq_entity *next_in_service) -+{ -+} -+#endif -+ -+/* -+ * Shift for timestamp calculations. This actually limits the maximum -+ * service allowed in one timestamp delta (small shift values increase it), -+ * the maximum total weight that can be used for the queues in the system -+ * (big shift values increase it), and the period of virtual time -+ * wraparounds. -+ */ -+#define WFQ_SERVICE_SHIFT 22 -+ -+/** -+ * bfq_gt - compare two timestamps. -+ * @a: first ts. -+ * @b: second ts. -+ * -+ * Return @a > @b, dealing with wrapping correctly. -+ */ -+static inline int bfq_gt(u64 a, u64 b) -+{ -+ return (s64)(a - b) > 0; -+} -+ -+static inline struct bfq_queue *bfq_entity_to_bfqq(struct bfq_entity *entity) -+{ -+ struct bfq_queue *bfqq = NULL; -+ -+ BUG_ON(entity == NULL); -+ -+ if (entity->my_sched_data == NULL) -+ bfqq = container_of(entity, struct bfq_queue, entity); -+ -+ return bfqq; -+} -+ -+ -+/** -+ * bfq_delta - map service into the virtual time domain. -+ * @service: amount of service. -+ * @weight: scale factor (weight of an entity or weight sum). -+ */ -+static inline u64 bfq_delta(unsigned long service, -+ unsigned long weight) -+{ -+ u64 d = (u64)service << WFQ_SERVICE_SHIFT; -+ -+ do_div(d, weight); -+ return d; -+} -+ -+/** -+ * bfq_calc_finish - assign the finish time to an entity. -+ * @entity: the entity to act upon. -+ * @service: the service to be charged to the entity. 
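The signed-difference trick in bfq_gt() is what keeps timestamp comparisons correct across virtual-time wraparound; a short stand-alone check:

#include <stdio.h>

typedef unsigned long long u64;
typedef long long s64;

/* Casting the unsigned difference to a signed type makes a value that has
 * recently wrapped past zero still compare as "later". */
static int bfq_gt(u64 a, u64 b)
{
	return (s64)(a - b) > 0;
}

int main(void)
{
	u64 before_wrap = ~0ULL - 5;   /* close to the top of the range */
	u64 after_wrap = 5;            /* just wrapped past zero        */

	printf("after_wrap > before_wrap: %d\n", bfq_gt(after_wrap, before_wrap));
	printf("before_wrap > after_wrap: %d\n", bfq_gt(before_wrap, after_wrap));
	return 0;
}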
-+ */ -+static inline void bfq_calc_finish(struct bfq_entity *entity, -+ unsigned long service) -+{ -+ struct bfq_queue *bfqq = bfq_entity_to_bfqq(entity); -+ -+ BUG_ON(entity->weight == 0); -+ -+ entity->finish = entity->start + -+ bfq_delta(service, entity->weight); -+ -+ if (bfqq != NULL) { -+ bfq_log_bfqq(bfqq->bfqd, bfqq, -+ "calc_finish: serv %lu, w %d", -+ service, entity->weight); -+ bfq_log_bfqq(bfqq->bfqd, bfqq, -+ "calc_finish: start %llu, finish %llu, delta %llu", -+ entity->start, entity->finish, -+ bfq_delta(service, entity->weight)); -+ } -+} -+ -+/** -+ * bfq_entity_of - get an entity from a node. -+ * @node: the node field of the entity. -+ * -+ * Convert a node pointer to the relative entity. This is used only -+ * to simplify the logic of some functions and not as the generic -+ * conversion mechanism because, e.g., in the tree walking functions, -+ * the check for a %NULL value would be redundant. -+ */ -+static inline struct bfq_entity *bfq_entity_of(struct rb_node *node) -+{ -+ struct bfq_entity *entity = NULL; -+ -+ if (node != NULL) -+ entity = rb_entry(node, struct bfq_entity, rb_node); -+ -+ return entity; -+} -+ -+/** -+ * bfq_extract - remove an entity from a tree. -+ * @root: the tree root. -+ * @entity: the entity to remove. -+ */ -+static inline void bfq_extract(struct rb_root *root, -+ struct bfq_entity *entity) -+{ -+ BUG_ON(entity->tree != root); -+ -+ entity->tree = NULL; -+ rb_erase(&entity->rb_node, root); -+} -+ -+/** -+ * bfq_idle_extract - extract an entity from the idle tree. -+ * @st: the service tree of the owning @entity. -+ * @entity: the entity being removed. -+ */ -+static void bfq_idle_extract(struct bfq_service_tree *st, -+ struct bfq_entity *entity) -+{ -+ struct bfq_queue *bfqq = bfq_entity_to_bfqq(entity); -+ struct rb_node *next; -+ -+ BUG_ON(entity->tree != &st->idle); -+ -+ if (entity == st->first_idle) { -+ next = rb_next(&entity->rb_node); -+ st->first_idle = bfq_entity_of(next); -+ } -+ -+ if (entity == st->last_idle) { -+ next = rb_prev(&entity->rb_node); -+ st->last_idle = bfq_entity_of(next); -+ } -+ -+ bfq_extract(&st->idle, entity); -+ -+ if (bfqq != NULL) -+ list_del(&bfqq->bfqq_list); -+} -+ -+/** -+ * bfq_insert - generic tree insertion. -+ * @root: tree root. -+ * @entity: entity to insert. -+ * -+ * This is used for the idle and the active tree, since they are both -+ * ordered by finish time. -+ */ -+static void bfq_insert(struct rb_root *root, struct bfq_entity *entity) -+{ -+ struct bfq_entity *entry; -+ struct rb_node **node = &root->rb_node; -+ struct rb_node *parent = NULL; -+ -+ BUG_ON(entity->tree != NULL); -+ -+ while (*node != NULL) { -+ parent = *node; -+ entry = rb_entry(parent, struct bfq_entity, rb_node); -+ -+ if (bfq_gt(entry->finish, entity->finish)) -+ node = &parent->rb_left; -+ else -+ node = &parent->rb_right; -+ } -+ -+ rb_link_node(&entity->rb_node, parent, node); -+ rb_insert_color(&entity->rb_node, root); -+ -+ entity->tree = root; -+} -+ -+/** -+ * bfq_update_min - update the min_start field of a entity. -+ * @entity: the entity to update. -+ * @node: one of its children. -+ * -+ * This function is called when @entity may store an invalid value for -+ * min_start due to updates to the active tree. The function assumes -+ * that the subtree rooted at @node (which may be its left or its right -+ * child) has a valid min_start value. 
-+ */ -+static inline void bfq_update_min(struct bfq_entity *entity, -+ struct rb_node *node) -+{ -+ struct bfq_entity *child; -+ -+ if (node != NULL) { -+ child = rb_entry(node, struct bfq_entity, rb_node); -+ if (bfq_gt(entity->min_start, child->min_start)) -+ entity->min_start = child->min_start; -+ } -+} -+ -+/** -+ * bfq_update_active_node - recalculate min_start. -+ * @node: the node to update. -+ * -+ * @node may have changed position or one of its children may have moved, -+ * this function updates its min_start value. The left and right subtrees -+ * are assumed to hold a correct min_start value. -+ */ -+static inline void bfq_update_active_node(struct rb_node *node) -+{ -+ struct bfq_entity *entity = rb_entry(node, struct bfq_entity, rb_node); -+ -+ entity->min_start = entity->start; -+ bfq_update_min(entity, node->rb_right); -+ bfq_update_min(entity, node->rb_left); -+} -+ -+/** -+ * bfq_update_active_tree - update min_start for the whole active tree. -+ * @node: the starting node. -+ * -+ * @node must be the deepest modified node after an update. This function -+ * updates its min_start using the values held by its children, assuming -+ * that they did not change, and then updates all the nodes that may have -+ * changed in the path to the root. The only nodes that may have changed -+ * are the ones in the path or their siblings. -+ */ -+static void bfq_update_active_tree(struct rb_node *node) -+{ -+ struct rb_node *parent; -+ -+up: -+ bfq_update_active_node(node); -+ -+ parent = rb_parent(node); -+ if (parent == NULL) -+ return; -+ -+ if (node == parent->rb_left && parent->rb_right != NULL) -+ bfq_update_active_node(parent->rb_right); -+ else if (parent->rb_left != NULL) -+ bfq_update_active_node(parent->rb_left); -+ -+ node = parent; -+ goto up; -+} -+ -+static void bfq_weights_tree_add(struct bfq_data *bfqd, -+ struct bfq_entity *entity, -+ struct rb_root *root); -+ -+static void bfq_weights_tree_remove(struct bfq_data *bfqd, -+ struct bfq_entity *entity, -+ struct rb_root *root); -+ -+ -+/** -+ * bfq_active_insert - insert an entity in the active tree of its -+ * group/device. -+ * @st: the service tree of the entity. -+ * @entity: the entity being inserted. -+ * -+ * The active tree is ordered by finish time, but an extra key is kept -+ * per each node, containing the minimum value for the start times of -+ * its children (and the node itself), so it's possible to search for -+ * the eligible node with the lowest finish time in logarithmic time. 
-+ */ -+static void bfq_active_insert(struct bfq_service_tree *st, -+ struct bfq_entity *entity) -+{ -+ struct bfq_queue *bfqq = bfq_entity_to_bfqq(entity); -+ struct rb_node *node = &entity->rb_node; -+#ifdef CONFIG_CGROUP_BFQIO -+ struct bfq_sched_data *sd = NULL; -+ struct bfq_group *bfqg = NULL; -+ struct bfq_data *bfqd = NULL; -+#endif -+ -+ bfq_insert(&st->active, entity); -+ -+ if (node->rb_left != NULL) -+ node = node->rb_left; -+ else if (node->rb_right != NULL) -+ node = node->rb_right; -+ -+ bfq_update_active_tree(node); -+ -+#ifdef CONFIG_CGROUP_BFQIO -+ sd = entity->sched_data; -+ bfqg = container_of(sd, struct bfq_group, sched_data); -+ BUG_ON(!bfqg); -+ bfqd = (struct bfq_data *)bfqg->bfqd; -+#endif -+ if (bfqq != NULL) -+ list_add(&bfqq->bfqq_list, &bfqq->bfqd->active_list); -+#ifdef CONFIG_CGROUP_BFQIO -+ else { /* bfq_group */ -+ BUG_ON(!bfqd); -+ bfq_weights_tree_add(bfqd, entity, &bfqd->group_weights_tree); -+ } -+ if (bfqg != bfqd->root_group) { -+ BUG_ON(!bfqg); -+ BUG_ON(!bfqd); -+ bfqg->active_entities++; -+ if (bfqg->active_entities == 2) -+ bfqd->active_numerous_groups++; -+ } -+#endif -+} -+ -+/** -+ * bfq_ioprio_to_weight - calc a weight from an ioprio. -+ * @ioprio: the ioprio value to convert. -+ */ -+static inline unsigned short bfq_ioprio_to_weight(int ioprio) -+{ -+ BUG_ON(ioprio < 0 || ioprio >= IOPRIO_BE_NR); -+ return IOPRIO_BE_NR - ioprio; -+} -+ -+/** -+ * bfq_weight_to_ioprio - calc an ioprio from a weight. -+ * @weight: the weight value to convert. -+ * -+ * To preserve as mush as possible the old only-ioprio user interface, -+ * 0 is used as an escape ioprio value for weights (numerically) equal or -+ * larger than IOPRIO_BE_NR -+ */ -+static inline unsigned short bfq_weight_to_ioprio(int weight) -+{ -+ BUG_ON(weight < BFQ_MIN_WEIGHT || weight > BFQ_MAX_WEIGHT); -+ return IOPRIO_BE_NR - weight < 0 ? 0 : IOPRIO_BE_NR - weight; -+} -+ -+static inline void bfq_get_entity(struct bfq_entity *entity) -+{ -+ struct bfq_queue *bfqq = bfq_entity_to_bfqq(entity); -+ -+ if (bfqq != NULL) { -+ atomic_inc(&bfqq->ref); -+ bfq_log_bfqq(bfqq->bfqd, bfqq, "get_entity: %p %d", -+ bfqq, atomic_read(&bfqq->ref)); -+ } -+} -+ -+/** -+ * bfq_find_deepest - find the deepest node that an extraction can modify. -+ * @node: the node being removed. -+ * -+ * Do the first step of an extraction in an rb tree, looking for the -+ * node that will replace @node, and returning the deepest node that -+ * the following modifications to the tree can touch. If @node is the -+ * last node in the tree return %NULL. -+ */ -+static struct rb_node *bfq_find_deepest(struct rb_node *node) -+{ -+ struct rb_node *deepest; -+ -+ if (node->rb_right == NULL && node->rb_left == NULL) -+ deepest = rb_parent(node); -+ else if (node->rb_right == NULL) -+ deepest = node->rb_left; -+ else if (node->rb_left == NULL) -+ deepest = node->rb_right; -+ else { -+ deepest = rb_next(node); -+ if (deepest->rb_right != NULL) -+ deepest = deepest->rb_right; -+ else if (rb_parent(deepest) != node) -+ deepest = rb_parent(deepest); -+ } -+ -+ return deepest; -+} -+ -+/** -+ * bfq_active_extract - remove an entity from the active tree. -+ * @st: the service_tree containing the tree. -+ * @entity: the entity being removed. 
-+ */ -+static void bfq_active_extract(struct bfq_service_tree *st, -+ struct bfq_entity *entity) -+{ -+ struct bfq_queue *bfqq = bfq_entity_to_bfqq(entity); -+ struct rb_node *node; -+#ifdef CONFIG_CGROUP_BFQIO -+ struct bfq_sched_data *sd = NULL; -+ struct bfq_group *bfqg = NULL; -+ struct bfq_data *bfqd = NULL; -+#endif -+ -+ node = bfq_find_deepest(&entity->rb_node); -+ bfq_extract(&st->active, entity); -+ -+ if (node != NULL) -+ bfq_update_active_tree(node); -+ -+#ifdef CONFIG_CGROUP_BFQIO -+ sd = entity->sched_data; -+ bfqg = container_of(sd, struct bfq_group, sched_data); -+ BUG_ON(!bfqg); -+ bfqd = (struct bfq_data *)bfqg->bfqd; -+#endif -+ if (bfqq != NULL) -+ list_del(&bfqq->bfqq_list); -+#ifdef CONFIG_CGROUP_BFQIO -+ else { /* bfq_group */ -+ BUG_ON(!bfqd); -+ bfq_weights_tree_remove(bfqd, entity, -+ &bfqd->group_weights_tree); -+ } -+ if (bfqg != bfqd->root_group) { -+ BUG_ON(!bfqg); -+ BUG_ON(!bfqd); -+ BUG_ON(!bfqg->active_entities); -+ bfqg->active_entities--; -+ if (bfqg->active_entities == 1) { -+ BUG_ON(!bfqd->active_numerous_groups); -+ bfqd->active_numerous_groups--; -+ } -+ } -+#endif -+} -+ -+/** -+ * bfq_idle_insert - insert an entity into the idle tree. -+ * @st: the service tree containing the tree. -+ * @entity: the entity to insert. -+ */ -+static void bfq_idle_insert(struct bfq_service_tree *st, -+ struct bfq_entity *entity) -+{ -+ struct bfq_queue *bfqq = bfq_entity_to_bfqq(entity); -+ struct bfq_entity *first_idle = st->first_idle; -+ struct bfq_entity *last_idle = st->last_idle; -+ -+ if (first_idle == NULL || bfq_gt(first_idle->finish, entity->finish)) -+ st->first_idle = entity; -+ if (last_idle == NULL || bfq_gt(entity->finish, last_idle->finish)) -+ st->last_idle = entity; -+ -+ bfq_insert(&st->idle, entity); -+ -+ if (bfqq != NULL) -+ list_add(&bfqq->bfqq_list, &bfqq->bfqd->idle_list); -+} -+ -+/** -+ * bfq_forget_entity - remove an entity from the wfq trees. -+ * @st: the service tree. -+ * @entity: the entity being removed. -+ * -+ * Update the device status and forget everything about @entity, putting -+ * the device reference to it, if it is a queue. Entities belonging to -+ * groups are not refcounted. -+ */ -+static void bfq_forget_entity(struct bfq_service_tree *st, -+ struct bfq_entity *entity) -+{ -+ struct bfq_queue *bfqq = bfq_entity_to_bfqq(entity); -+ struct bfq_sched_data *sd; -+ -+ BUG_ON(!entity->on_st); -+ -+ entity->on_st = 0; -+ st->wsum -= entity->weight; -+ if (bfqq != NULL) { -+ sd = entity->sched_data; -+ bfq_log_bfqq(bfqq->bfqd, bfqq, "forget_entity: %p %d", -+ bfqq, atomic_read(&bfqq->ref)); -+ bfq_put_queue(bfqq); -+ } -+} -+ -+/** -+ * bfq_put_idle_entity - release the idle tree ref of an entity. -+ * @st: service tree for the entity. -+ * @entity: the entity being released. -+ */ -+static void bfq_put_idle_entity(struct bfq_service_tree *st, -+ struct bfq_entity *entity) -+{ -+ bfq_idle_extract(st, entity); -+ bfq_forget_entity(st, entity); -+} -+ -+/** -+ * bfq_forget_idle - update the idle tree if necessary. -+ * @st: the service tree to act upon. -+ * -+ * To preserve the global O(log N) complexity we only remove one entry here; -+ * as the idle tree will not grow indefinitely this can be done safely. 
-+ */ -+static void bfq_forget_idle(struct bfq_service_tree *st) -+{ -+ struct bfq_entity *first_idle = st->first_idle; -+ struct bfq_entity *last_idle = st->last_idle; -+ -+ if (RB_EMPTY_ROOT(&st->active) && last_idle != NULL && -+ !bfq_gt(last_idle->finish, st->vtime)) { -+ /* -+ * Forget the whole idle tree, increasing the vtime past -+ * the last finish time of idle entities. -+ */ -+ st->vtime = last_idle->finish; -+ } -+ -+ if (first_idle != NULL && !bfq_gt(first_idle->finish, st->vtime)) -+ bfq_put_idle_entity(st, first_idle); -+} -+ -+static struct bfq_service_tree * -+__bfq_entity_update_weight_prio(struct bfq_service_tree *old_st, -+ struct bfq_entity *entity) -+{ -+ struct bfq_service_tree *new_st = old_st; -+ -+ if (entity->ioprio_changed) { -+ struct bfq_queue *bfqq = bfq_entity_to_bfqq(entity); -+ unsigned short prev_weight, new_weight; -+ struct bfq_data *bfqd = NULL; -+ struct rb_root *root; -+#ifdef CONFIG_CGROUP_BFQIO -+ struct bfq_sched_data *sd; -+ struct bfq_group *bfqg; -+#endif -+ -+ if (bfqq != NULL) -+ bfqd = bfqq->bfqd; -+#ifdef CONFIG_CGROUP_BFQIO -+ else { -+ sd = entity->my_sched_data; -+ bfqg = container_of(sd, struct bfq_group, sched_data); -+ BUG_ON(!bfqg); -+ bfqd = (struct bfq_data *)bfqg->bfqd; -+ BUG_ON(!bfqd); -+ } -+#endif -+ -+ BUG_ON(old_st->wsum < entity->weight); -+ old_st->wsum -= entity->weight; -+ -+ if (entity->new_weight != entity->orig_weight) { -+ if (entity->new_weight < BFQ_MIN_WEIGHT || -+ entity->new_weight > BFQ_MAX_WEIGHT) { -+ printk(KERN_CRIT "update_weight_prio: " -+ "new_weight %d\n", -+ entity->new_weight); -+ BUG(); -+ } -+ entity->orig_weight = entity->new_weight; -+ entity->ioprio = -+ bfq_weight_to_ioprio(entity->orig_weight); -+ } else if (entity->new_ioprio != entity->ioprio) { -+ entity->ioprio = entity->new_ioprio; -+ entity->orig_weight = -+ bfq_ioprio_to_weight(entity->ioprio); -+ } else -+ entity->new_weight = entity->orig_weight = -+ bfq_ioprio_to_weight(entity->ioprio); -+ -+ entity->ioprio_class = entity->new_ioprio_class; -+ entity->ioprio_changed = 0; -+ -+ /* -+ * NOTE: here we may be changing the weight too early, -+ * this will cause unfairness. The correct approach -+ * would have required additional complexity to defer -+ * weight changes to the proper time instants (i.e., -+ * when entity->finish <= old_st->vtime). -+ */ -+ new_st = bfq_entity_service_tree(entity); -+ -+ prev_weight = entity->weight; -+ new_weight = entity->orig_weight * -+ (bfqq != NULL ? bfqq->wr_coeff : 1); -+ /* -+ * If the weight of the entity changes, remove the entity -+ * from its old weight counter (if there is a counter -+ * associated with the entity), and add it to the counter -+ * associated with its new weight. -+ */ -+ if (prev_weight != new_weight) { -+ root = bfqq ? &bfqd->queue_weights_tree : -+ &bfqd->group_weights_tree; -+ bfq_weights_tree_remove(bfqd, entity, root); -+ } -+ entity->weight = new_weight; -+ /* -+ * Add the entity to its weights tree only if it is -+ * not associated with a weight-raised queue. -+ */ -+ if (prev_weight != new_weight && -+ (bfqq ? bfqq->wr_coeff == 1 : 1)) -+ /* If we get here, root has been initialized. */ -+ bfq_weights_tree_add(bfqd, entity, root); -+ -+ new_st->wsum += entity->weight; -+ -+ if (new_st != old_st) -+ entity->start = new_st->vtime; -+ } -+ -+ return new_st; -+} -+ -+/** -+ * bfq_bfqq_served - update the scheduler status after selection for -+ * service. -+ * @bfqq: the queue being served. -+ * @served: bytes to transfer. 
-+ * -+ * NOTE: this can be optimized, as the timestamps of upper level entities -+ * are synchronized every time a new bfqq is selected for service. By now, -+ * we keep it to better check consistency. -+ */ -+static void bfq_bfqq_served(struct bfq_queue *bfqq, unsigned long served) -+{ -+ struct bfq_entity *entity = &bfqq->entity; -+ struct bfq_service_tree *st; -+ -+ for_each_entity(entity) { -+ st = bfq_entity_service_tree(entity); -+ -+ entity->service += served; -+ BUG_ON(entity->service > entity->budget); -+ BUG_ON(st->wsum == 0); -+ -+ st->vtime += bfq_delta(served, st->wsum); -+ bfq_forget_idle(st); -+ } -+ bfq_log_bfqq(bfqq->bfqd, bfqq, "bfqq_served %lu secs", served); -+} -+ -+/** -+ * bfq_bfqq_charge_full_budget - set the service to the entity budget. -+ * @bfqq: the queue that needs a service update. -+ * -+ * When it's not possible to be fair in the service domain, because -+ * a queue is not consuming its budget fast enough (the meaning of -+ * fast depends on the timeout parameter), we charge it a full -+ * budget. In this way we should obtain a sort of time-domain -+ * fairness among all the seeky/slow queues. -+ */ -+static inline void bfq_bfqq_charge_full_budget(struct bfq_queue *bfqq) -+{ -+ struct bfq_entity *entity = &bfqq->entity; -+ -+ bfq_log_bfqq(bfqq->bfqd, bfqq, "charge_full_budget"); -+ -+ bfq_bfqq_served(bfqq, entity->budget - entity->service); -+} -+ -+/** -+ * __bfq_activate_entity - activate an entity. -+ * @entity: the entity being activated. -+ * -+ * Called whenever an entity is activated, i.e., it is not active and one -+ * of its children receives a new request, or has to be reactivated due to -+ * budget exhaustion. It uses the current budget of the entity (and the -+ * service received if @entity is active) of the queue to calculate its -+ * timestamps. -+ */ -+static void __bfq_activate_entity(struct bfq_entity *entity) -+{ -+ struct bfq_sched_data *sd = entity->sched_data; -+ struct bfq_service_tree *st = bfq_entity_service_tree(entity); -+ -+ if (entity == sd->in_service_entity) { -+ BUG_ON(entity->tree != NULL); -+ /* -+ * If we are requeueing the current entity we have -+ * to take care of not charging to it service it has -+ * not received. -+ */ -+ bfq_calc_finish(entity, entity->service); -+ entity->start = entity->finish; -+ sd->in_service_entity = NULL; -+ } else if (entity->tree == &st->active) { -+ /* -+ * Requeueing an entity due to a change of some -+ * next_in_service entity below it. We reuse the -+ * old start time. -+ */ -+ bfq_active_extract(st, entity); -+ } else if (entity->tree == &st->idle) { -+ /* -+ * Must be on the idle tree, bfq_idle_extract() will -+ * check for that. -+ */ -+ bfq_idle_extract(st, entity); -+ entity->start = bfq_gt(st->vtime, entity->finish) ? -+ st->vtime : entity->finish; -+ } else { -+ /* -+ * The finish time of the entity may be invalid, and -+ * it is in the past for sure, otherwise the queue -+ * would have been on the idle tree. -+ */ -+ entity->start = st->vtime; -+ st->wsum += entity->weight; -+ bfq_get_entity(entity); -+ -+ BUG_ON(entity->on_st); -+ entity->on_st = 1; -+ } -+ -+ st = __bfq_entity_update_weight_prio(st, entity); -+ bfq_calc_finish(entity, entity->budget); -+ bfq_active_insert(st, entity); -+} -+ -+/** -+ * bfq_activate_entity - activate an entity and its ancestors if necessary. -+ * @entity: the entity to activate. -+ * -+ * Activate @entity and all the entities on the path from it to the root. 
-+ */ -+static void bfq_activate_entity(struct bfq_entity *entity) -+{ -+ struct bfq_sched_data *sd; -+ -+ for_each_entity(entity) { -+ __bfq_activate_entity(entity); -+ -+ sd = entity->sched_data; -+ if (!bfq_update_next_in_service(sd)) -+ /* -+ * No need to propagate the activation to the -+ * upper entities, as they will be updated when -+ * the in-service entity is rescheduled. -+ */ -+ break; -+ } -+} -+ -+/** -+ * __bfq_deactivate_entity - deactivate an entity from its service tree. -+ * @entity: the entity to deactivate. -+ * @requeue: if false, the entity will not be put into the idle tree. -+ * -+ * Deactivate an entity, independently from its previous state. If the -+ * entity was not on a service tree just return, otherwise if it is on -+ * any scheduler tree, extract it from that tree, and if necessary -+ * and if the caller did not specify @requeue, put it on the idle tree. -+ * -+ * Return %1 if the caller should update the entity hierarchy, i.e., -+ * if the entity was in service or if it was the next_in_service for -+ * its sched_data; return %0 otherwise. -+ */ -+static int __bfq_deactivate_entity(struct bfq_entity *entity, int requeue) -+{ -+ struct bfq_sched_data *sd = entity->sched_data; -+ struct bfq_service_tree *st = bfq_entity_service_tree(entity); -+ int was_in_service = entity == sd->in_service_entity; -+ int ret = 0; -+ -+ if (!entity->on_st) -+ return 0; -+ -+ BUG_ON(was_in_service && entity->tree != NULL); -+ -+ if (was_in_service) { -+ bfq_calc_finish(entity, entity->service); -+ sd->in_service_entity = NULL; -+ } else if (entity->tree == &st->active) -+ bfq_active_extract(st, entity); -+ else if (entity->tree == &st->idle) -+ bfq_idle_extract(st, entity); -+ else if (entity->tree != NULL) -+ BUG(); -+ -+ if (was_in_service || sd->next_in_service == entity) -+ ret = bfq_update_next_in_service(sd); -+ -+ if (!requeue || !bfq_gt(entity->finish, st->vtime)) -+ bfq_forget_entity(st, entity); -+ else -+ bfq_idle_insert(st, entity); -+ -+ BUG_ON(sd->in_service_entity == entity); -+ BUG_ON(sd->next_in_service == entity); -+ -+ return ret; -+} -+ -+/** -+ * bfq_deactivate_entity - deactivate an entity. -+ * @entity: the entity to deactivate. -+ * @requeue: true if the entity can be put on the idle tree -+ */ -+static void bfq_deactivate_entity(struct bfq_entity *entity, int requeue) -+{ -+ struct bfq_sched_data *sd; -+ struct bfq_entity *parent; -+ -+ for_each_entity_safe(entity, parent) { -+ sd = entity->sched_data; -+ -+ if (!__bfq_deactivate_entity(entity, requeue)) -+ /* -+ * The parent entity is still backlogged, and -+ * we don't need to update it as it is still -+ * in service. -+ */ -+ break; -+ -+ if (sd->next_in_service != NULL) -+ /* -+ * The parent entity is still backlogged and -+ * the budgets on the path towards the root -+ * need to be updated. -+ */ -+ goto update; -+ -+ /* -+ * If we reach there the parent is no more backlogged and -+ * we want to propagate the dequeue upwards. -+ */ -+ requeue = 1; -+ } -+ -+ return; -+ -+update: -+ entity = parent; -+ for_each_entity(entity) { -+ __bfq_activate_entity(entity); -+ -+ sd = entity->sched_data; -+ if (!bfq_update_next_in_service(sd)) -+ break; -+ } -+} -+ -+/** -+ * bfq_update_vtime - update vtime if necessary. -+ * @st: the service tree to act upon. -+ * -+ * If necessary update the service tree vtime to have at least one -+ * eligible entity, skipping to its start time. Assumes that the -+ * active tree of the device is not empty. 
-+ * -+ * NOTE: this hierarchical implementation updates vtimes quite often, -+ * we may end up with reactivated processes getting timestamps after a -+ * vtime skip done because we needed a ->first_active entity on some -+ * intermediate node. -+ */ -+static void bfq_update_vtime(struct bfq_service_tree *st) -+{ -+ struct bfq_entity *entry; -+ struct rb_node *node = st->active.rb_node; -+ -+ entry = rb_entry(node, struct bfq_entity, rb_node); -+ if (bfq_gt(entry->min_start, st->vtime)) { -+ st->vtime = entry->min_start; -+ bfq_forget_idle(st); -+ } -+} -+ -+/** -+ * bfq_first_active_entity - find the eligible entity with -+ * the smallest finish time -+ * @st: the service tree to select from. -+ * -+ * This function searches the first schedulable entity, starting from the -+ * root of the tree and going on the left every time on this side there is -+ * a subtree with at least one eligible (start >= vtime) entity. The path on -+ * the right is followed only if a) the left subtree contains no eligible -+ * entities and b) no eligible entity has been found yet. -+ */ -+static struct bfq_entity *bfq_first_active_entity(struct bfq_service_tree *st) -+{ -+ struct bfq_entity *entry, *first = NULL; -+ struct rb_node *node = st->active.rb_node; -+ -+ while (node != NULL) { -+ entry = rb_entry(node, struct bfq_entity, rb_node); -+left: -+ if (!bfq_gt(entry->start, st->vtime)) -+ first = entry; -+ -+ BUG_ON(bfq_gt(entry->min_start, st->vtime)); -+ -+ if (node->rb_left != NULL) { -+ entry = rb_entry(node->rb_left, -+ struct bfq_entity, rb_node); -+ if (!bfq_gt(entry->min_start, st->vtime)) { -+ node = node->rb_left; -+ goto left; -+ } -+ } -+ if (first != NULL) -+ break; -+ node = node->rb_right; -+ } -+ -+ BUG_ON(first == NULL && !RB_EMPTY_ROOT(&st->active)); -+ return first; -+} -+ -+/** -+ * __bfq_lookup_next_entity - return the first eligible entity in @st. -+ * @st: the service tree. -+ * -+ * Update the virtual time in @st and return the first eligible entity -+ * it contains. -+ */ -+static struct bfq_entity *__bfq_lookup_next_entity(struct bfq_service_tree *st, -+ bool force) -+{ -+ struct bfq_entity *entity, *new_next_in_service = NULL; -+ -+ if (RB_EMPTY_ROOT(&st->active)) -+ return NULL; -+ -+ bfq_update_vtime(st); -+ entity = bfq_first_active_entity(st); -+ BUG_ON(bfq_gt(entity->start, st->vtime)); -+ -+ /* -+ * If the chosen entity does not match with the sched_data's -+ * next_in_service and we are forcedly serving the IDLE priority -+ * class tree, bubble up budget update. -+ */ -+ if (unlikely(force && entity != entity->sched_data->next_in_service)) { -+ new_next_in_service = entity; -+ for_each_entity(new_next_in_service) -+ bfq_update_budget(new_next_in_service); -+ } -+ -+ return entity; -+} -+ -+/** -+ * bfq_lookup_next_entity - return the first eligible entity in @sd. -+ * @sd: the sched_data. -+ * @extract: if true the returned entity will be also extracted from @sd. -+ * -+ * NOTE: since we cache the next_in_service entity at each level of the -+ * hierarchy, the complexity of the lookup can be decreased with -+ * absolutely no effort just returning the cached next_in_service value; -+ * we prefer to do full lookups to test the consistency of * the data -+ * structures. 
-+ */ -+static struct bfq_entity *bfq_lookup_next_entity(struct bfq_sched_data *sd, -+ int extract, -+ struct bfq_data *bfqd) -+{ -+ struct bfq_service_tree *st = sd->service_tree; -+ struct bfq_entity *entity; -+ int i = 0; -+ -+ BUG_ON(sd->in_service_entity != NULL); -+ -+ if (bfqd != NULL && -+ jiffies - bfqd->bfq_class_idle_last_service > BFQ_CL_IDLE_TIMEOUT) { -+ entity = __bfq_lookup_next_entity(st + BFQ_IOPRIO_CLASSES - 1, -+ true); -+ if (entity != NULL) { -+ i = BFQ_IOPRIO_CLASSES - 1; -+ bfqd->bfq_class_idle_last_service = jiffies; -+ sd->next_in_service = entity; -+ } -+ } -+ for (; i < BFQ_IOPRIO_CLASSES; i++) { -+ entity = __bfq_lookup_next_entity(st + i, false); -+ if (entity != NULL) { -+ if (extract) { -+ bfq_check_next_in_service(sd, entity); -+ bfq_active_extract(st + i, entity); -+ sd->in_service_entity = entity; -+ sd->next_in_service = NULL; -+ } -+ break; -+ } -+ } -+ -+ return entity; -+} -+ -+/* -+ * Get next queue for service. -+ */ -+static struct bfq_queue *bfq_get_next_queue(struct bfq_data *bfqd) -+{ -+ struct bfq_entity *entity = NULL; -+ struct bfq_sched_data *sd; -+ struct bfq_queue *bfqq; -+ -+ BUG_ON(bfqd->in_service_queue != NULL); -+ -+ if (bfqd->busy_queues == 0) -+ return NULL; -+ -+ sd = &bfqd->root_group->sched_data; -+ for (; sd != NULL; sd = entity->my_sched_data) { -+ entity = bfq_lookup_next_entity(sd, 1, bfqd); -+ BUG_ON(entity == NULL); -+ entity->service = 0; -+ } -+ -+ bfqq = bfq_entity_to_bfqq(entity); -+ BUG_ON(bfqq == NULL); -+ -+ return bfqq; -+} -+ -+static void __bfq_bfqd_reset_in_service(struct bfq_data *bfqd) -+{ -+ if (bfqd->in_service_bic != NULL) { -+ put_io_context(bfqd->in_service_bic->icq.ioc); -+ bfqd->in_service_bic = NULL; -+ } -+ -+ bfqd->in_service_queue = NULL; -+ del_timer(&bfqd->idle_slice_timer); -+} -+ -+static void bfq_deactivate_bfqq(struct bfq_data *bfqd, struct bfq_queue *bfqq, -+ int requeue) -+{ -+ struct bfq_entity *entity = &bfqq->entity; -+ -+ if (bfqq == bfqd->in_service_queue) -+ __bfq_bfqd_reset_in_service(bfqd); -+ -+ bfq_deactivate_entity(entity, requeue); -+} -+ -+static void bfq_activate_bfqq(struct bfq_data *bfqd, struct bfq_queue *bfqq) -+{ -+ struct bfq_entity *entity = &bfqq->entity; -+ -+ bfq_activate_entity(entity); -+} -+ -+/* -+ * Called when the bfqq no longer has requests pending, remove it from -+ * the service tree. -+ */ -+static void bfq_del_bfqq_busy(struct bfq_data *bfqd, struct bfq_queue *bfqq, -+ int requeue) -+{ -+ BUG_ON(!bfq_bfqq_busy(bfqq)); -+ BUG_ON(!RB_EMPTY_ROOT(&bfqq->sort_list)); -+ -+ bfq_log_bfqq(bfqd, bfqq, "del from busy"); -+ -+ bfq_clear_bfqq_busy(bfqq); -+ -+ BUG_ON(bfqd->busy_queues == 0); -+ bfqd->busy_queues--; -+ -+ if (!bfqq->dispatched) { -+ bfq_weights_tree_remove(bfqd, &bfqq->entity, -+ &bfqd->queue_weights_tree); -+ if (!blk_queue_nonrot(bfqd->queue)) { -+ BUG_ON(!bfqd->busy_in_flight_queues); -+ bfqd->busy_in_flight_queues--; -+ if (bfq_bfqq_constantly_seeky(bfqq)) { -+ BUG_ON(!bfqd-> -+ const_seeky_busy_in_flight_queues); -+ bfqd->const_seeky_busy_in_flight_queues--; -+ } -+ } -+ } -+ if (bfqq->wr_coeff > 1) -+ bfqd->wr_busy_queues--; -+ -+ bfq_deactivate_bfqq(bfqd, bfqq, requeue); -+} -+ -+/* -+ * Called when an inactive queue receives a new request. 
-+ */ -+static void bfq_add_bfqq_busy(struct bfq_data *bfqd, struct bfq_queue *bfqq) -+{ -+ BUG_ON(bfq_bfqq_busy(bfqq)); -+ BUG_ON(bfqq == bfqd->in_service_queue); -+ -+ bfq_log_bfqq(bfqd, bfqq, "add to busy"); -+ -+ bfq_activate_bfqq(bfqd, bfqq); -+ -+ bfq_mark_bfqq_busy(bfqq); -+ bfqd->busy_queues++; -+ -+ if (!bfqq->dispatched) { -+ if (bfqq->wr_coeff == 1) -+ bfq_weights_tree_add(bfqd, &bfqq->entity, -+ &bfqd->queue_weights_tree); -+ if (!blk_queue_nonrot(bfqd->queue)) { -+ bfqd->busy_in_flight_queues++; -+ if (bfq_bfqq_constantly_seeky(bfqq)) -+ bfqd->const_seeky_busy_in_flight_queues++; -+ } -+ } -+ if (bfqq->wr_coeff > 1) -+ bfqd->wr_busy_queues++; -+} -diff -Nur linux-4.1.3/block/Kconfig.iosched linux-xbian-imx6/block/Kconfig.iosched ---- linux-4.1.3/block/Kconfig.iosched 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/block/Kconfig.iosched 2015-07-27 23:13:03.600137415 +0200 -@@ -39,6 +39,27 @@ - ---help--- - Enable group IO scheduling in CFQ. - -+config IOSCHED_BFQ -+ tristate "BFQ I/O scheduler" -+ default n -+ ---help--- -+ The BFQ I/O scheduler tries to distribute bandwidth among -+ all processes according to their weights. -+ It aims at distributing the bandwidth as desired, independently of -+ the disk parameters and with any workload. It also tries to -+ guarantee low latency to interactive and soft real-time -+ applications. If compiled built-in (saying Y here), BFQ can -+ be configured to support hierarchical scheduling. -+ -+config CGROUP_BFQIO -+ bool "BFQ hierarchical scheduling support" -+ depends on CGROUPS && IOSCHED_BFQ=y -+ default n -+ ---help--- -+ Enable hierarchical scheduling in BFQ, using the cgroups -+ filesystem interface. The name of the subsystem will be -+ bfqio. -+ - choice - prompt "Default I/O scheduler" - default DEFAULT_CFQ -@@ -52,6 +73,16 @@ - config DEFAULT_CFQ - bool "CFQ" if IOSCHED_CFQ=y - -+ config DEFAULT_BFQ -+ bool "BFQ" if IOSCHED_BFQ=y -+ help -+ Selects BFQ as the default I/O scheduler which will be -+ used by default for all block devices. -+ The BFQ I/O scheduler aims at distributing the bandwidth -+ as desired, independently of the disk parameters and with -+ any workload. It also tries to guarantee low latency to -+ interactive and soft real-time applications. -+ - config DEFAULT_NOOP - bool "No-op" - -@@ -61,6 +92,7 @@ - string - default "deadline" if DEFAULT_DEADLINE - default "cfq" if DEFAULT_CFQ -+ default "bfq" if DEFAULT_BFQ - default "noop" if DEFAULT_NOOP - - endmenu -diff -Nur linux-4.1.3/block/Makefile linux-xbian-imx6/block/Makefile ---- linux-4.1.3/block/Makefile 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/block/Makefile 2015-07-27 23:13:03.600137415 +0200 -@@ -18,6 +18,7 @@ - obj-$(CONFIG_IOSCHED_NOOP) += noop-iosched.o - obj-$(CONFIG_IOSCHED_DEADLINE) += deadline-iosched.o - obj-$(CONFIG_IOSCHED_CFQ) += cfq-iosched.o -+obj-$(CONFIG_IOSCHED_BFQ) += bfq-iosched.o - - obj-$(CONFIG_BLOCK_COMPAT) += compat_ioctl.o - obj-$(CONFIG_BLK_CMDLINE_PARSER) += cmdline-parser.o -diff -Nur linux-4.1.3/Documentation/devicetree/bindings/mmc/mmc.txt linux-xbian-imx6/Documentation/devicetree/bindings/mmc/mmc.txt ---- linux-4.1.3/Documentation/devicetree/bindings/mmc/mmc.txt 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/Documentation/devicetree/bindings/mmc/mmc.txt 2015-07-27 23:12:59.335353684 +0200 -@@ -5,6 +5,8 @@ - Interpreted by the OF core: - - reg: Registers location and length. - - interrupts: Interrupts used by the MMC controller. -+- clocks: Clocks needed for the host controller, if any. 
-+- clock-names: Goes with clocks above. - - Card detection: - If no property below is supplied, host native card detect is used. -@@ -43,6 +45,15 @@ - - dsr: Value the card's (optional) Driver Stage Register (DSR) should be - programmed with. Valid range: [0 .. 0xffff]. - -+Card power and reset control: -+The following properties can be specified for cases where the MMC -+peripheral needs additional reset, regulator and clock lines. It is for -+example common for WiFi/BT adapters to have these separate from the main -+MMC bus: -+ - card-reset-gpios: Specify GPIOs for card reset (reset active low) -+ - card-external-vcc-supply: Regulator to drive (independent) card VCC -+ - clock with name "card_ext_clock": External clock provided to the card -+ - *NOTE* on CD and WP polarity. To use common for all SD/MMC host controllers line - polarity properties, we have to fix the meaning of the "normal" and "inverted" - line levels. We choose to follow the SDHCI standard, which specifies both those -diff -Nur linux-4.1.3/Documentation/devicetree/bindings/vendor-prefixes.txt linux-xbian-imx6/Documentation/devicetree/bindings/vendor-prefixes.txt ---- linux-4.1.3/Documentation/devicetree/bindings/vendor-prefixes.txt 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/Documentation/devicetree/bindings/vendor-prefixes.txt 2015-07-27 23:12:59.518699524 +0200 -@@ -201,6 +201,7 @@ - variscite Variscite Ltd. - via VIA Technologies, Inc. - virtio Virtual I/O Device Specification, developed by the OASIS consortium -+vivante Vivante Corporation - voipac Voipac Technologies s.r.o. - winbond Winbond Electronics corp. - wlf Wolfson Microelectronics -diff -Nur linux-4.1.3/drivers/char/frandom.c linux-xbian-imx6/drivers/char/frandom.c ---- linux-4.1.3/drivers/char/frandom.c 1970-01-01 01:00:00.000000000 +0100 -+++ linux-xbian-imx6/drivers/char/frandom.c 2015-07-27 23:13:03.986757999 +0200 -@@ -0,0 +1,415 @@ -+/* -+** frandom.c -+** Fast pseudo-random generator -+** -+** (c) Copyright 2003-2011 Eli Billauer -+** http://www.billauer.co.il -+** -+** This program is free software; you can redistribute it and/or modify -+** it under the terms of the GNU General Public License as published by -+** the Free Software Foundation; either version 2 of the License, or -+** (at your option) any later version. 
-+** -+** -+*/ -+ -+#include -+#include -+#include -+ -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+ -+#include -+#include -+#include -+#include -+ -+#define INTERNAL_SEED 0 -+#define EXTERNAL_SEED 1 -+ -+#define FRANDOM_MAJOR 235 -+#define FRANDOM_MINOR 11 -+#define ERANDOM_MINOR 12 -+ -+static struct file_operations frandom_fops; /* Values assigned below */ -+ -+static int erandom_seeded = 0; /* Internal flag */ -+ -+static int frandom_major = FRANDOM_MAJOR; -+static int frandom_minor = FRANDOM_MINOR; -+static int erandom_minor = ERANDOM_MINOR; -+static int frandom_bufsize = 256; -+static int frandom_chunklimit = 0; /* =0 means unlimited */ -+ -+static struct cdev frandom_cdev; -+static struct cdev erandom_cdev; -+static struct class *frandom_class; -+struct device *frandom_device; -+struct device *erandom_device; -+ -+MODULE_DESCRIPTION("Fast pseudo-random number generator"); -+MODULE_LICENSE("GPL"); -+MODULE_AUTHOR("Eli Billauer"); -+module_param(frandom_major, int, 0); -+module_param(frandom_minor, int, 0); -+module_param(erandom_minor, int, 0); -+module_param(frandom_bufsize, int, 0); -+module_param(frandom_chunklimit, int, 0); -+ -+MODULE_PARM_DESC(frandom_major,"Major number of /dev/frandom and /dev/erandom"); -+MODULE_PARM_DESC(frandom_minor,"Minor number of /dev/frandom"); -+MODULE_PARM_DESC(erandom_minor,"Minor number of /dev/erandom"); -+MODULE_PARM_DESC(frandom_bufsize,"Internal buffer size in bytes. Default is 256. Must be >= 256"); -+MODULE_PARM_DESC(frandom_chunklimit,"Limit for read() blocks size. 0 (default) is unlimited, otherwise must be >= 256"); -+ -+struct frandom_state -+{ -+ struct semaphore sem; /* Semaphore on the state structure */ -+ -+ u8 S[256]; /* The state array */ -+ u8 i; -+ u8 j; -+ -+ char *buf; -+}; -+ -+static struct frandom_state *erandom_state; -+ -+static inline void swap_byte(u8 *a, u8 *b) -+{ -+ u8 swapByte; -+ -+ swapByte = *a; -+ *a = *b; -+ *b = swapByte; -+} -+ -+static void init_rand_state(struct frandom_state *state, int seedflag); -+ -+void erandom_get_random_bytes(char *buf, size_t count) -+{ -+ struct frandom_state *state = erandom_state; -+ int k; -+ -+ unsigned int i; -+ unsigned int j; -+ u8 *S; -+ -+ /* If we fail to get the semaphore, we revert to external random data. -+ Since semaphore blocking is expected to be very rare, and interrupts -+ during these rare and very short periods of time even less frequent, -+ we take the better-safe-than-sorry approach, and fill the buffer -+ some expensive random data, in case the caller wasn't aware of this -+ possibility, and expects random data anyhow. -+ */ -+ -+ if (down_interruptible(&state->sem)) { -+ get_random_bytes(buf, count); -+ return; -+ } -+ -+ /* We seed erandom as late as possible, hoping that the kernel's main -+ RNG is already restored in the boot sequence (not critical, but -+ better. 
-+ */ -+ -+ if (!erandom_seeded) { -+ erandom_seeded = 1; -+ init_rand_state(state, EXTERNAL_SEED); -+ printk(KERN_INFO "frandom: Seeded global generator now (used by erandom)\n"); -+ } -+ -+ i = state->i; -+ j = state->j; -+ S = state->S; -+ -+ for (k=0; ki = i; -+ state->j = j; -+ -+ up(&state->sem); -+} -+ -+static void init_rand_state(struct frandom_state *state, int seedflag) -+{ -+ unsigned int i, j, k; -+ u8 *S; -+ u8 *seed = state->buf; -+ -+ if (seedflag == INTERNAL_SEED) -+ erandom_get_random_bytes(seed, 256); -+ else -+ get_random_bytes(seed, 256); -+ -+ S = state->S; -+ for (i=0; i<256; i++) -+ *S++=i; -+ -+ j=0; -+ S = state->S; -+ -+ for (i=0; i<256; i++) { -+ j = (j + S[i] + *seed++) & 0xff; -+ swap_byte(&S[i], &S[j]); -+ } -+ -+ /* It's considered good practice to discard the first 256 bytes -+ generated. So we do it: -+ */ -+ -+ i=0; j=0; -+ for (k=0; k<256; k++) { -+ i = (i + 1) & 0xff; -+ j = (j + S[i]) & 0xff; -+ swap_byte(&S[i], &S[j]); -+ } -+ -+ state->i = i; /* Save state */ -+ state->j = j; -+} -+ -+static int frandom_open(struct inode *inode, struct file *filp) -+{ -+ -+ struct frandom_state *state; -+ -+ int num = iminor(inode); -+ -+ /* This should never happen, now when the minors are regsitered -+ * explicitly -+ */ -+ if ((num != frandom_minor) && (num != erandom_minor)) return -ENODEV; -+ -+ state = kmalloc(sizeof(struct frandom_state), GFP_KERNEL); -+ if (!state) -+ return -ENOMEM; -+ -+ state->buf = kmalloc(frandom_bufsize, GFP_KERNEL); -+ if (!state->buf) { -+ kfree(state); -+ return -ENOMEM; -+ } -+ -+ sema_init(&state->sem, 1); /* Init semaphore as a mutex */ -+ -+ if (num == frandom_minor) -+ init_rand_state(state, EXTERNAL_SEED); -+ else -+ init_rand_state(state, INTERNAL_SEED); -+ -+ filp->private_data = state; -+ -+ return 0; /* Success */ -+} -+ -+static int frandom_release(struct inode *inode, struct file *filp) -+{ -+ -+ struct frandom_state *state = filp->private_data; -+ -+ kfree(state->buf); -+ kfree(state); -+ -+ return 0; -+} -+ -+static ssize_t frandom_read(struct file *filp, char *buf, size_t count, -+ loff_t *f_pos) -+{ -+ struct frandom_state *state = filp->private_data; -+ ssize_t ret; -+ int dobytes, k; -+ char *localbuf; -+ -+ unsigned int i; -+ unsigned int j; -+ u8 *S; -+ -+ if (down_interruptible(&state->sem)) -+ return -ERESTARTSYS; -+ -+ if ((frandom_chunklimit > 0) && (count > frandom_chunklimit)) -+ count = frandom_chunklimit; -+ -+ ret = count; /* It's either everything or an error... 
*/ -+ -+ i = state->i; -+ j = state->j; -+ S = state->S; -+ -+ while (count) { -+ if (count > frandom_bufsize) -+ dobytes = frandom_bufsize; -+ else -+ dobytes = count; -+ -+ localbuf = state->buf; -+ -+ for (k=0; kbuf, dobytes)) { -+ ret = -EFAULT; -+ goto out; -+ } -+ -+ buf += dobytes; -+ count -= dobytes; -+ } -+ -+ out: -+ state->i = i; -+ state->j = j; -+ -+ up(&state->sem); -+ return ret; -+} -+ -+static struct file_operations frandom_fops = { -+ read: frandom_read, -+ open: frandom_open, -+ release: frandom_release, -+}; -+ -+static void frandom_cleanup_module(void) { -+ unregister_chrdev_region(MKDEV(frandom_major, erandom_minor), 1); -+ cdev_del(&erandom_cdev); -+ device_destroy(frandom_class, MKDEV(frandom_major, erandom_minor)); -+ -+ unregister_chrdev_region(MKDEV(frandom_major, frandom_minor), 1); -+ cdev_del(&frandom_cdev); -+ device_destroy(frandom_class, MKDEV(frandom_major, frandom_minor)); -+ class_destroy(frandom_class); -+ -+ kfree(erandom_state->buf); -+ kfree(erandom_state); -+} -+ -+ -+static int frandom_init_module(void) -+{ -+ int result; -+ -+ /* The buffer size MUST be at least 256 bytes, because we assume that -+ minimal length in init_rand_state(). -+ */ -+ if (frandom_bufsize < 256) { -+ printk(KERN_ERR "frandom: Refused to load because frandom_bufsize=%d < 256\n",frandom_bufsize); -+ return -EINVAL; -+ } -+ if ((frandom_chunklimit != 0) && (frandom_chunklimit < 256)) { -+ printk(KERN_ERR "frandom: Refused to load because frandom_chunklimit=%d < 256 and != 0\n",frandom_chunklimit); -+ return -EINVAL; -+ } -+ -+ erandom_state = kmalloc(sizeof(struct frandom_state), GFP_KERNEL); -+ if (!erandom_state) -+ return -ENOMEM; -+ -+ /* This specific buffer is only used for seeding, so we need -+ 256 bytes exactly */ -+ erandom_state->buf = kmalloc(256, GFP_KERNEL); -+ if (!erandom_state->buf) { -+ kfree(erandom_state); -+ return -ENOMEM; -+ } -+ -+ sema_init(&erandom_state->sem, 1); /* Init semaphore as a mutex */ -+ -+ erandom_seeded = 0; -+ -+ frandom_class = class_create(THIS_MODULE, "fastrng"); -+ if (IS_ERR(frandom_class)) { -+ result = PTR_ERR(frandom_class); -+ printk(KERN_WARNING "frandom: Failed to register class fastrng\n"); -+ goto error0; -+ } -+ -+ /* -+ * Register your major, and accept a dynamic number. 
This is the -+ * first thing to do, in order to avoid releasing other module's -+ * fops in frandom_cleanup_module() -+ */ -+ -+ cdev_init(&frandom_cdev, &frandom_fops); -+ frandom_cdev.owner = THIS_MODULE; -+ result = cdev_add(&frandom_cdev, MKDEV(frandom_major, frandom_minor), 1); -+ if (result) { -+ printk(KERN_WARNING "frandom: Failed to add cdev for /dev/frandom\n"); -+ goto error1; -+ } -+ -+ result = register_chrdev_region(MKDEV(frandom_major, frandom_minor), 1, "/dev/frandom"); -+ if (result < 0) { -+ printk(KERN_WARNING "frandom: can't get major/minor %d/%d\n", frandom_major, frandom_minor); -+ goto error2; -+ } -+ -+ frandom_device = device_create(frandom_class, NULL, MKDEV(frandom_major, frandom_minor), NULL, "frandom"); -+ -+ if (IS_ERR(frandom_device)) { -+ printk(KERN_WARNING "frandom: Failed to create frandom device\n"); -+ goto error3; -+ } -+ -+ cdev_init(&erandom_cdev, &frandom_fops); -+ erandom_cdev.owner = THIS_MODULE; -+ result = cdev_add(&erandom_cdev, MKDEV(frandom_major, erandom_minor), 1); -+ if (result) { -+ printk(KERN_WARNING "frandom: Failed to add cdev for /dev/erandom\n"); -+ goto error4; -+ } -+ -+ result = register_chrdev_region(MKDEV(frandom_major, erandom_minor), 1, "/dev/erandom"); -+ if (result < 0) { -+ printk(KERN_WARNING "frandom: can't get major/minor %d/%d\n", frandom_major, erandom_minor); -+ goto error5; -+ } -+ -+ erandom_device = device_create(frandom_class, NULL, MKDEV(frandom_major, erandom_minor), NULL, "erandom"); -+ -+ if (IS_ERR(erandom_device)) { -+ printk(KERN_WARNING "frandom: Failed to create erandom device\n"); -+ goto error6; -+ } -+ return 0; /* succeed */ -+ -+ error6: -+ unregister_chrdev_region(MKDEV(frandom_major, erandom_minor), 1); -+ error5: -+ cdev_del(&erandom_cdev); -+ error4: -+ device_destroy(frandom_class, MKDEV(frandom_major, frandom_minor)); -+ error3: -+ unregister_chrdev_region(MKDEV(frandom_major, frandom_minor), 1); -+ error2: -+ cdev_del(&frandom_cdev); -+ error1: -+ class_destroy(frandom_class); -+ error0: -+ kfree(erandom_state->buf); -+ kfree(erandom_state); -+ -+ return result; -+} -+ -+module_init(frandom_init_module); -+module_exit(frandom_cleanup_module); -+ -+EXPORT_SYMBOL(erandom_get_random_bytes); -diff -Nur linux-4.1.3/drivers/char/Makefile linux-xbian-imx6/drivers/char/Makefile ---- linux-4.1.3/drivers/char/Makefile 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/drivers/char/Makefile 2015-07-27 23:13:03.982772220 +0200 -@@ -2,6 +2,7 @@ - # Makefile for the kernel character device drivers. 
- # - -+obj-m += frandom.o - obj-y += mem.o random.o - obj-$(CONFIG_TTY_PRINTK) += ttyprintk.o - obj-y += misc.o -diff -Nur linux-4.1.3/drivers/cpufreq/imx6q-cpufreq.c linux-xbian-imx6/drivers/cpufreq/imx6q-cpufreq.c ---- linux-4.1.3/drivers/cpufreq/imx6q-cpufreq.c 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/drivers/cpufreq/imx6q-cpufreq.c 2015-07-27 23:13:04.158146502 +0200 -@@ -20,6 +20,8 @@ - #define PU_SOC_VOLTAGE_HIGH 1275000 - #define FREQ_1P2_GHZ 1200000000 - -+extern int vpu352; -+ - static struct regulator *arm_reg; - static struct regulator *pu_reg; - static struct regulator *soc_reg; -@@ -251,6 +253,10 @@ - unsigned long volt = be32_to_cpup(val++); - if (freq_table[j].frequency == freq) { - imx6_soc_volt[soc_opp_count++] = volt; -+ if (vpu352 && freq == 792000) { -+ pr_info("VPU352: increase SOC/PU voltage for VPU352MHz\n"); -+ imx6_soc_volt[soc_opp_count-1] = 1250000; -+ } - break; - } - } -diff -Nur linux-4.1.3/drivers/crypto/caam/caamalg.c linux-xbian-imx6/drivers/crypto/caam/caamalg.c ---- linux-4.1.3/drivers/crypto/caam/caamalg.c 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/drivers/crypto/caam/caamalg.c 2015-07-27 23:13:04.205975852 +0200 -@@ -1,7 +1,7 @@ - /* - * caam - Freescale FSL CAAM support for crypto API - * -- * Copyright 2008-2011 Freescale Semiconductor, Inc. -+ * Copyright (C) 2008-2013 Freescale Semiconductor, Inc. - * - * Based on talitos crypto API driver. - * -@@ -53,6 +53,7 @@ - #include "error.h" - #include "sg_sw_sec4.h" - #include "key_gen.h" -+#include - - /* - * crypto alg -@@ -60,68 +61,42 @@ - #define CAAM_CRA_PRIORITY 3000 - /* max key is sum of AES_MAX_KEY_SIZE, max split key size */ - #define CAAM_MAX_KEY_SIZE (AES_MAX_KEY_SIZE + \ -- CTR_RFC3686_NONCE_SIZE + \ - SHA512_DIGEST_SIZE * 2) - /* max IV is max of AES_BLOCK_SIZE, DES3_EDE_BLOCK_SIZE */ - #define CAAM_MAX_IV_LENGTH 16 - - /* length of descriptors text */ -+#define DESC_JOB_IO_LEN (CAAM_CMD_SZ * 5 + CAAM_PTR_SZ * 3) -+ - #define DESC_AEAD_BASE (4 * CAAM_CMD_SZ) --#define DESC_AEAD_ENC_LEN (DESC_AEAD_BASE + 15 * CAAM_CMD_SZ) --#define DESC_AEAD_DEC_LEN (DESC_AEAD_BASE + 18 * CAAM_CMD_SZ) -+#define DESC_AEAD_ENC_LEN (DESC_AEAD_BASE + 16 * CAAM_CMD_SZ) -+#define DESC_AEAD_DEC_LEN (DESC_AEAD_BASE + 21 * CAAM_CMD_SZ) - #define DESC_AEAD_GIVENC_LEN (DESC_AEAD_ENC_LEN + 7 * CAAM_CMD_SZ) - --/* Note: Nonce is counted in enckeylen */ --#define DESC_AEAD_CTR_RFC3686_LEN (6 * CAAM_CMD_SZ) -- --#define DESC_AEAD_NULL_BASE (3 * CAAM_CMD_SZ) --#define DESC_AEAD_NULL_ENC_LEN (DESC_AEAD_NULL_BASE + 14 * CAAM_CMD_SZ) --#define DESC_AEAD_NULL_DEC_LEN (DESC_AEAD_NULL_BASE + 17 * CAAM_CMD_SZ) -- --#define DESC_GCM_BASE (3 * CAAM_CMD_SZ) --#define DESC_GCM_ENC_LEN (DESC_GCM_BASE + 23 * CAAM_CMD_SZ) --#define DESC_GCM_DEC_LEN (DESC_GCM_BASE + 19 * CAAM_CMD_SZ) -- --#define DESC_RFC4106_BASE (3 * CAAM_CMD_SZ) --#define DESC_RFC4106_ENC_LEN (DESC_RFC4106_BASE + 15 * CAAM_CMD_SZ) --#define DESC_RFC4106_DEC_LEN (DESC_RFC4106_BASE + 14 * CAAM_CMD_SZ) --#define DESC_RFC4106_GIVENC_LEN (DESC_RFC4106_BASE + 21 * CAAM_CMD_SZ) -- --#define DESC_RFC4543_BASE (3 * CAAM_CMD_SZ) --#define DESC_RFC4543_ENC_LEN (DESC_RFC4543_BASE + 25 * CAAM_CMD_SZ) --#define DESC_RFC4543_DEC_LEN (DESC_RFC4543_BASE + 27 * CAAM_CMD_SZ) --#define DESC_RFC4543_GIVENC_LEN (DESC_RFC4543_BASE + 30 * CAAM_CMD_SZ) -- - #define DESC_ABLKCIPHER_BASE (3 * CAAM_CMD_SZ) - #define DESC_ABLKCIPHER_ENC_LEN (DESC_ABLKCIPHER_BASE + \ - 20 * CAAM_CMD_SZ) - #define DESC_ABLKCIPHER_DEC_LEN (DESC_ABLKCIPHER_BASE + \ - 15 * CAAM_CMD_SZ) - 
--#define DESC_MAX_USED_BYTES (DESC_RFC4543_GIVENC_LEN + \ -+#define DESC_MAX_USED_BYTES (DESC_AEAD_GIVENC_LEN + \ - CAAM_MAX_KEY_SIZE) - #define DESC_MAX_USED_LEN (DESC_MAX_USED_BYTES / CAAM_CMD_SZ) - - #ifdef DEBUG - /* for print_hex_dumps with line references */ -+#define xstr(s) str(s) -+#define str(s) #s - #define debug(format, arg...) printk(format, arg) - #else - #define debug(format, arg...) - #endif --static struct list_head alg_list; - - /* Set DK bit in class 1 operation if shared */ - static inline void append_dec_op1(u32 *desc, u32 type) - { - u32 *jump_cmd, *uncond_jump_cmd; - -- /* DK bit is valid only for AES */ -- if ((type & OP_ALG_ALGSEL_MASK) != OP_ALG_ALGSEL_AES) { -- append_operation(desc, type | OP_ALG_AS_INITFINAL | -- OP_ALG_DECRYPT); -- return; -- } -- - jump_cmd = append_jump(desc, JUMP_TEST_ALL | JUMP_COND_SHRD); - append_operation(desc, type | OP_ALG_AS_INITFINAL | - OP_ALG_DECRYPT); -@@ -133,26 +108,37 @@ - } - - /* -+ * Wait for completion of class 1 key loading before allowing -+ * error propagation -+ */ -+static inline void append_dec_shr_done(u32 *desc) -+{ -+ u32 *jump_cmd; -+ -+ jump_cmd = append_jump(desc, JUMP_CLASS_CLASS1 | JUMP_TEST_ALL); -+ set_jump_tgt_here(desc, jump_cmd); -+ append_cmd(desc, SET_OK_NO_PROP_ERRORS | CMD_LOAD); -+} -+ -+/* - * For aead functions, read payload and write payload, - * both of which are specified in req->src and req->dst - */ - static inline void aead_append_src_dst(u32 *desc, u32 msg_type) - { -- append_seq_fifo_store(desc, 0, FIFOST_TYPE_MESSAGE_DATA | KEY_VLF); - append_seq_fifo_load(desc, 0, FIFOLD_CLASS_BOTH | - KEY_VLF | msg_type | FIFOLD_TYPE_LASTBOTH); -+ append_seq_fifo_store(desc, 0, FIFOST_TYPE_MESSAGE_DATA | KEY_VLF); - } - - /* - * For aead encrypt and decrypt, read iv for both classes - */ --static inline void aead_append_ld_iv(u32 *desc, int ivsize, int ivoffset) -+static inline void aead_append_ld_iv(u32 *desc, int ivsize) - { -- append_seq_load(desc, ivsize, LDST_CLASS_1_CCB | -- LDST_SRCDST_BYTE_CONTEXT | -- (ivoffset << LDST_OFFSET_SHIFT)); -- append_move(desc, MOVE_SRC_CLASS1CTX | MOVE_DEST_CLASS2INFIFO | -- (ivoffset << MOVE_OFFSET_SHIFT) | ivsize); -+ append_cmd(desc, CMD_SEQ_LOAD | LDST_SRCDST_BYTE_CONTEXT | -+ LDST_CLASS_1_CCB | ivsize); -+ append_move(desc, MOVE_SRC_CLASS1CTX | MOVE_DEST_CLASS2INFIFO | ivsize); - } - - /* -@@ -198,309 +184,68 @@ - }; - - static void append_key_aead(u32 *desc, struct caam_ctx *ctx, -- int keys_fit_inline, bool is_rfc3686) -+ int keys_fit_inline) - { -- u32 *nonce; -- unsigned int enckeylen = ctx->enckeylen; -- -- /* -- * RFC3686 specific: -- * | ctx->key = {AUTH_KEY, ENC_KEY, NONCE} -- * | enckeylen = encryption key size + nonce size -- */ -- if (is_rfc3686) -- enckeylen -= CTR_RFC3686_NONCE_SIZE; -- - if (keys_fit_inline) { - append_key_as_imm(desc, ctx->key, ctx->split_key_pad_len, - ctx->split_key_len, CLASS_2 | - KEY_DEST_MDHA_SPLIT | KEY_ENC); - append_key_as_imm(desc, (void *)ctx->key + -- ctx->split_key_pad_len, enckeylen, -- enckeylen, CLASS_1 | KEY_DEST_CLASS_REG); -+ ctx->split_key_pad_len, ctx->enckeylen, -+ ctx->enckeylen, CLASS_1 | KEY_DEST_CLASS_REG); - } else { - append_key(desc, ctx->key_dma, ctx->split_key_len, CLASS_2 | - KEY_DEST_MDHA_SPLIT | KEY_ENC); - append_key(desc, ctx->key_dma + ctx->split_key_pad_len, -- enckeylen, CLASS_1 | KEY_DEST_CLASS_REG); -- } -- -- /* Load Counter into CONTEXT1 reg */ -- if (is_rfc3686) { -- nonce = (u32 *)((void *)ctx->key + ctx->split_key_pad_len + -- enckeylen); -- append_load_imm_u32(desc, *nonce, 
LDST_CLASS_IND_CCB | -- LDST_SRCDST_BYTE_OUTFIFO | LDST_IMM); -- append_move(desc, -- MOVE_SRC_OUTFIFO | -- MOVE_DEST_CLASS1CTX | -- (16 << MOVE_OFFSET_SHIFT) | -- (CTR_RFC3686_NONCE_SIZE << MOVE_LEN_SHIFT)); -+ ctx->enckeylen, CLASS_1 | KEY_DEST_CLASS_REG); - } - } - - static void init_sh_desc_key_aead(u32 *desc, struct caam_ctx *ctx, -- int keys_fit_inline, bool is_rfc3686) -+ int keys_fit_inline) - { - u32 *key_jump_cmd; - -- /* Note: Context registers are saved. */ -- init_sh_desc(desc, HDR_SHARE_SERIAL | HDR_SAVECTX); -- -- /* Skip if already shared */ -- key_jump_cmd = append_jump(desc, JUMP_JSL | JUMP_TEST_ALL | -- JUMP_COND_SHRD); -- -- append_key_aead(desc, ctx, keys_fit_inline, is_rfc3686); -- -- set_jump_tgt_here(desc, key_jump_cmd); --} -- --static int aead_null_set_sh_desc(struct crypto_aead *aead) --{ -- struct aead_tfm *tfm = &aead->base.crt_aead; -- struct caam_ctx *ctx = crypto_aead_ctx(aead); -- struct device *jrdev = ctx->jrdev; -- bool keys_fit_inline = false; -- u32 *key_jump_cmd, *jump_cmd, *read_move_cmd, *write_move_cmd; -- u32 *desc; -- -- /* -- * Job Descriptor and Shared Descriptors -- * must all fit into the 64-word Descriptor h/w Buffer -- */ -- if (DESC_AEAD_NULL_ENC_LEN + DESC_JOB_IO_LEN + -- ctx->split_key_pad_len <= CAAM_DESC_BYTES_MAX) -- keys_fit_inline = true; -- -- /* aead_encrypt shared descriptor */ -- desc = ctx->sh_desc_enc; -- - init_sh_desc(desc, HDR_SHARE_SERIAL); - - /* Skip if already shared */ - key_jump_cmd = append_jump(desc, JUMP_JSL | JUMP_TEST_ALL | - JUMP_COND_SHRD); -- if (keys_fit_inline) -- append_key_as_imm(desc, ctx->key, ctx->split_key_pad_len, -- ctx->split_key_len, CLASS_2 | -- KEY_DEST_MDHA_SPLIT | KEY_ENC); -- else -- append_key(desc, ctx->key_dma, ctx->split_key_len, CLASS_2 | -- KEY_DEST_MDHA_SPLIT | KEY_ENC); -- set_jump_tgt_here(desc, key_jump_cmd); -- -- /* cryptlen = seqoutlen - authsize */ -- append_math_sub_imm_u32(desc, REG3, SEQOUTLEN, IMM, ctx->authsize); -- -- /* -- * NULL encryption; IV is zero -- * assoclen = (assoclen + cryptlen) - cryptlen -- */ -- append_math_sub(desc, VARSEQINLEN, SEQINLEN, REG3, CAAM_CMD_SZ); -- -- /* read assoc before reading payload */ -- append_seq_fifo_load(desc, 0, FIFOLD_CLASS_CLASS2 | FIFOLD_TYPE_MSG | -- KEY_VLF); -- -- /* Prepare to read and write cryptlen bytes */ -- append_math_add(desc, VARSEQINLEN, ZERO, REG3, CAAM_CMD_SZ); -- append_math_add(desc, VARSEQOUTLEN, ZERO, REG3, CAAM_CMD_SZ); -- -- /* -- * MOVE_LEN opcode is not available in all SEC HW revisions, -- * thus need to do some magic, i.e. self-patch the descriptor -- * buffer. 
-- */ -- read_move_cmd = append_move(desc, MOVE_SRC_DESCBUF | -- MOVE_DEST_MATH3 | -- (0x6 << MOVE_LEN_SHIFT)); -- write_move_cmd = append_move(desc, MOVE_SRC_MATH3 | -- MOVE_DEST_DESCBUF | -- MOVE_WAITCOMP | -- (0x8 << MOVE_LEN_SHIFT)); -- -- /* Class 2 operation */ -- append_operation(desc, ctx->class2_alg_type | -- OP_ALG_AS_INITFINAL | OP_ALG_ENCRYPT); -- -- /* Read and write cryptlen bytes */ -- aead_append_src_dst(desc, FIFOLD_TYPE_MSG | FIFOLD_TYPE_FLUSH1); -- -- set_move_tgt_here(desc, read_move_cmd); -- set_move_tgt_here(desc, write_move_cmd); -- append_cmd(desc, CMD_LOAD | DISABLE_AUTO_INFO_FIFO); -- append_move(desc, MOVE_SRC_INFIFO_CL | MOVE_DEST_OUTFIFO | -- MOVE_AUX_LS); -- -- /* Write ICV */ -- append_seq_store(desc, ctx->authsize, LDST_CLASS_2_CCB | -- LDST_SRCDST_BYTE_CONTEXT); -- -- ctx->sh_desc_enc_dma = dma_map_single(jrdev, desc, -- desc_bytes(desc), -- DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, ctx->sh_desc_enc_dma)) { -- dev_err(jrdev, "unable to map shared descriptor\n"); -- return -ENOMEM; -- } --#ifdef DEBUG -- print_hex_dump(KERN_ERR, -- "aead null enc shdesc@"__stringify(__LINE__)": ", -- DUMP_PREFIX_ADDRESS, 16, 4, desc, -- desc_bytes(desc), 1); --#endif -- -- /* -- * Job Descriptor and Shared Descriptors -- * must all fit into the 64-word Descriptor h/w Buffer -- */ -- keys_fit_inline = false; -- if (DESC_AEAD_NULL_DEC_LEN + DESC_JOB_IO_LEN + -- ctx->split_key_pad_len <= CAAM_DESC_BYTES_MAX) -- keys_fit_inline = true; -- -- desc = ctx->sh_desc_dec; - -- /* aead_decrypt shared descriptor */ -- init_sh_desc(desc, HDR_SHARE_SERIAL); -+ append_key_aead(desc, ctx, keys_fit_inline); - -- /* Skip if already shared */ -- key_jump_cmd = append_jump(desc, JUMP_JSL | JUMP_TEST_ALL | -- JUMP_COND_SHRD); -- if (keys_fit_inline) -- append_key_as_imm(desc, ctx->key, ctx->split_key_pad_len, -- ctx->split_key_len, CLASS_2 | -- KEY_DEST_MDHA_SPLIT | KEY_ENC); -- else -- append_key(desc, ctx->key_dma, ctx->split_key_len, CLASS_2 | -- KEY_DEST_MDHA_SPLIT | KEY_ENC); - set_jump_tgt_here(desc, key_jump_cmd); - -- /* Class 2 operation */ -- append_operation(desc, ctx->class2_alg_type | -- OP_ALG_AS_INITFINAL | OP_ALG_DECRYPT | OP_ALG_ICV_ON); -- -- /* assoclen + cryptlen = seqinlen - ivsize - authsize */ -- append_math_sub_imm_u32(desc, REG3, SEQINLEN, IMM, -- ctx->authsize + tfm->ivsize); -- /* assoclen = (assoclen + cryptlen) - cryptlen */ -- append_math_sub(desc, REG2, SEQOUTLEN, REG0, CAAM_CMD_SZ); -- append_math_sub(desc, VARSEQINLEN, REG3, REG2, CAAM_CMD_SZ); -- -- /* read assoc before reading payload */ -- append_seq_fifo_load(desc, 0, FIFOLD_CLASS_CLASS2 | FIFOLD_TYPE_MSG | -- KEY_VLF); -- -- /* Prepare to read and write cryptlen bytes */ -- append_math_add(desc, VARSEQINLEN, ZERO, REG2, CAAM_CMD_SZ); -- append_math_add(desc, VARSEQOUTLEN, ZERO, REG2, CAAM_CMD_SZ); -- -- /* -- * MOVE_LEN opcode is not available in all SEC HW revisions, -- * thus need to do some magic, i.e. self-patch the descriptor -- * buffer. -- */ -- read_move_cmd = append_move(desc, MOVE_SRC_DESCBUF | -- MOVE_DEST_MATH2 | -- (0x6 << MOVE_LEN_SHIFT)); -- write_move_cmd = append_move(desc, MOVE_SRC_MATH2 | -- MOVE_DEST_DESCBUF | -- MOVE_WAITCOMP | -- (0x8 << MOVE_LEN_SHIFT)); -- -- /* Read and write cryptlen bytes */ -- aead_append_src_dst(desc, FIFOLD_TYPE_MSG | FIFOLD_TYPE_FLUSH1); -- -- /* -- * Insert a NOP here, since we need at least 4 instructions between -- * code patching the descriptor buffer and the location being patched. 
-- */ -- jump_cmd = append_jump(desc, JUMP_TEST_ALL); -- set_jump_tgt_here(desc, jump_cmd); -- -- set_move_tgt_here(desc, read_move_cmd); -- set_move_tgt_here(desc, write_move_cmd); -- append_cmd(desc, CMD_LOAD | DISABLE_AUTO_INFO_FIFO); -- append_move(desc, MOVE_SRC_INFIFO_CL | MOVE_DEST_OUTFIFO | -- MOVE_AUX_LS); -- append_cmd(desc, CMD_LOAD | ENABLE_AUTO_INFO_FIFO); -- -- /* Load ICV */ -- append_seq_fifo_load(desc, ctx->authsize, FIFOLD_CLASS_CLASS2 | -- FIFOLD_TYPE_LAST2 | FIFOLD_TYPE_ICV); -- -- ctx->sh_desc_dec_dma = dma_map_single(jrdev, desc, -- desc_bytes(desc), -- DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, ctx->sh_desc_dec_dma)) { -- dev_err(jrdev, "unable to map shared descriptor\n"); -- return -ENOMEM; -- } --#ifdef DEBUG -- print_hex_dump(KERN_ERR, -- "aead null dec shdesc@"__stringify(__LINE__)": ", -- DUMP_PREFIX_ADDRESS, 16, 4, desc, -- desc_bytes(desc), 1); --#endif -- -- return 0; -+ /* Propagate errors from shared to job descriptor */ -+ append_cmd(desc, SET_OK_NO_PROP_ERRORS | CMD_LOAD); - } - - static int aead_set_sh_desc(struct crypto_aead *aead) - { - struct aead_tfm *tfm = &aead->base.crt_aead; - struct caam_ctx *ctx = crypto_aead_ctx(aead); -- struct crypto_tfm *ctfm = crypto_aead_tfm(aead); -- const char *alg_name = crypto_tfm_alg_name(ctfm); - struct device *jrdev = ctx->jrdev; -- bool keys_fit_inline; -+ bool keys_fit_inline = false; -+ u32 *key_jump_cmd, *jump_cmd; - u32 geniv, moveiv; -- u32 ctx1_iv_off = 0; - u32 *desc; -- const bool ctr_mode = ((ctx->class1_alg_type & OP_ALG_AAI_MASK) == -- OP_ALG_AAI_CTR_MOD128); -- const bool is_rfc3686 = (ctr_mode && -- (strstr(alg_name, "rfc3686") != NULL)); - -- if (!ctx->authsize) -+ if (!ctx->enckeylen || !ctx->authsize) - return 0; - -- /* NULL encryption / decryption */ -- if (!ctx->enckeylen) -- return aead_null_set_sh_desc(aead); -- -- /* -- * AES-CTR needs to load IV in CONTEXT1 reg -- * at an offset of 128bits (16bytes) -- * CONTEXT1[255:128] = IV -- */ -- if (ctr_mode) -- ctx1_iv_off = 16; -- -- /* -- * RFC3686 specific: -- * CONTEXT1[255:128] = {NONCE, IV, COUNTER} -- */ -- if (is_rfc3686) -- ctx1_iv_off = 16 + CTR_RFC3686_NONCE_SIZE; -- - /* - * Job Descriptor and Shared Descriptors - * must all fit into the 64-word Descriptor h/w Buffer - */ -- keys_fit_inline = false; - if (DESC_AEAD_ENC_LEN + DESC_JOB_IO_LEN + -- ctx->split_key_pad_len + ctx->enckeylen + -- (is_rfc3686 ? DESC_AEAD_CTR_RFC3686_LEN : 0) <= -+ ctx->split_key_pad_len + ctx->enckeylen <= - CAAM_DESC_BYTES_MAX) - keys_fit_inline = true; - - /* aead_encrypt shared descriptor */ - desc = ctx->sh_desc_enc; - -- /* Note: Context registers are saved. 
*/ -- init_sh_desc_key_aead(desc, ctx, keys_fit_inline, is_rfc3686); -+ init_sh_desc_key_aead(desc, ctx, keys_fit_inline); - - /* Class 2 operation */ - append_operation(desc, ctx->class2_alg_type | -@@ -512,21 +257,13 @@ - /* assoclen + cryptlen = seqinlen - ivsize */ - append_math_sub_imm_u32(desc, REG2, SEQINLEN, IMM, tfm->ivsize); - -- /* assoclen = (assoclen + cryptlen) - cryptlen */ -+ /* assoclen + cryptlen = (assoclen + cryptlen) - cryptlen */ - append_math_sub(desc, VARSEQINLEN, REG2, REG3, CAAM_CMD_SZ); - - /* read assoc before reading payload */ - append_seq_fifo_load(desc, 0, FIFOLD_CLASS_CLASS2 | FIFOLD_TYPE_MSG | - KEY_VLF); -- aead_append_ld_iv(desc, tfm->ivsize, ctx1_iv_off); -- -- /* Load Counter into CONTEXT1 reg */ -- if (is_rfc3686) -- append_load_imm_u32(desc, be32_to_cpu(1), LDST_IMM | -- LDST_CLASS_1_CCB | -- LDST_SRCDST_BYTE_CONTEXT | -- ((ctx1_iv_off + CTR_RFC3686_IV_SIZE) << -- LDST_OFFSET_SHIFT)); -+ aead_append_ld_iv(desc, tfm->ivsize); - - /* Class 1 operation */ - append_operation(desc, ctx->class1_alg_type | -@@ -549,35 +286,46 @@ - return -ENOMEM; - } - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "aead enc shdesc@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "aead enc shdesc@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, desc, - desc_bytes(desc), 1); - #endif - -+ dma_sync_single_for_cpu(jrdev, ctx->sh_desc_enc_dma, desc_bytes(desc), -+ DMA_TO_DEVICE); - /* - * Job Descriptor and Shared Descriptors - * must all fit into the 64-word Descriptor h/w Buffer - */ -- keys_fit_inline = false; - if (DESC_AEAD_DEC_LEN + DESC_JOB_IO_LEN + -- ctx->split_key_pad_len + ctx->enckeylen + -- (is_rfc3686 ? DESC_AEAD_CTR_RFC3686_LEN : 0) <= -+ ctx->split_key_pad_len + ctx->enckeylen <= - CAAM_DESC_BYTES_MAX) - keys_fit_inline = true; - -- /* aead_decrypt shared descriptor */ - desc = ctx->sh_desc_dec; - -- /* Note: Context registers are saved. 
*/ -- init_sh_desc_key_aead(desc, ctx, keys_fit_inline, is_rfc3686); -+ /* aead_decrypt shared descriptor */ -+ init_sh_desc(desc, HDR_SHARE_SERIAL); -+ -+ /* Skip if already shared */ -+ key_jump_cmd = append_jump(desc, JUMP_JSL | JUMP_TEST_ALL | -+ JUMP_COND_SHRD); -+ -+ append_key_aead(desc, ctx, keys_fit_inline); -+ -+ /* Only propagate error immediately if shared */ -+ jump_cmd = append_jump(desc, JUMP_TEST_ALL); -+ set_jump_tgt_here(desc, key_jump_cmd); -+ append_cmd(desc, SET_OK_NO_PROP_ERRORS | CMD_LOAD); -+ set_jump_tgt_here(desc, jump_cmd); - - /* Class 2 operation */ - append_operation(desc, ctx->class2_alg_type | - OP_ALG_AS_INITFINAL | OP_ALG_DECRYPT | OP_ALG_ICV_ON); - -- /* assoclen + cryptlen = seqinlen - ivsize - authsize */ -+ /* assoclen + cryptlen = seqinlen - ivsize */ - append_math_sub_imm_u32(desc, REG3, SEQINLEN, IMM, -- ctx->authsize + tfm->ivsize); -+ ctx->authsize + tfm->ivsize) - /* assoclen = (assoclen + cryptlen) - cryptlen */ - append_math_sub(desc, REG2, SEQOUTLEN, REG0, CAAM_CMD_SZ); - append_math_sub(desc, VARSEQINLEN, REG3, REG2, CAAM_CMD_SZ); -@@ -586,22 +334,9 @@ - append_seq_fifo_load(desc, 0, FIFOLD_CLASS_CLASS2 | FIFOLD_TYPE_MSG | - KEY_VLF); - -- aead_append_ld_iv(desc, tfm->ivsize, ctx1_iv_off); -+ aead_append_ld_iv(desc, tfm->ivsize); - -- /* Load Counter into CONTEXT1 reg */ -- if (is_rfc3686) -- append_load_imm_u32(desc, be32_to_cpu(1), LDST_IMM | -- LDST_CLASS_1_CCB | -- LDST_SRCDST_BYTE_CONTEXT | -- ((ctx1_iv_off + CTR_RFC3686_IV_SIZE) << -- LDST_OFFSET_SHIFT)); -- -- /* Choose operation */ -- if (ctr_mode) -- append_operation(desc, ctx->class1_alg_type | -- OP_ALG_AS_INITFINAL | OP_ALG_DECRYPT); -- else -- append_dec_op1(desc, ctx->class1_alg_type); -+ append_dec_op1(desc, ctx->class1_alg_type); - - /* Read and write cryptlen bytes */ - append_math_add(desc, VARSEQINLEN, ZERO, REG2, CAAM_CMD_SZ); -@@ -611,6 +346,7 @@ - /* Load ICV */ - append_seq_fifo_load(desc, ctx->authsize, FIFOLD_CLASS_CLASS2 | - FIFOLD_TYPE_LAST2 | FIFOLD_TYPE_ICV); -+ append_dec_shr_done(desc); - - ctx->sh_desc_dec_dma = dma_map_single(jrdev, desc, - desc_bytes(desc), -@@ -620,27 +356,26 @@ - return -ENOMEM; - } - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "aead dec shdesc@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "aead dec shdesc@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, desc, - desc_bytes(desc), 1); - #endif -+ dma_sync_single_for_cpu(jrdev, ctx->sh_desc_dec_dma, desc_bytes(desc), -+ DMA_TO_DEVICE); - - /* - * Job Descriptor and Shared Descriptors - * must all fit into the 64-word Descriptor h/w Buffer - */ -- keys_fit_inline = false; - if (DESC_AEAD_GIVENC_LEN + DESC_JOB_IO_LEN + -- ctx->split_key_pad_len + ctx->enckeylen + -- (is_rfc3686 ? DESC_AEAD_CTR_RFC3686_LEN : 0) <= -+ ctx->split_key_pad_len + ctx->enckeylen <= - CAAM_DESC_BYTES_MAX) - keys_fit_inline = true; - - /* aead_givencrypt shared descriptor */ - desc = ctx->sh_desc_givenc; - -- /* Note: Context registers are saved. 
*/ -- init_sh_desc_key_aead(desc, ctx, keys_fit_inline, is_rfc3686); -+ init_sh_desc_key_aead(desc, ctx, keys_fit_inline); - - /* Generate IV */ - geniv = NFIFOENTRY_STYPE_PAD | NFIFOENTRY_DEST_DECO | -@@ -649,16 +384,13 @@ - append_load_imm_u32(desc, geniv, LDST_CLASS_IND_CCB | - LDST_SRCDST_WORD_INFO_FIFO | LDST_IMM); - append_cmd(desc, CMD_LOAD | DISABLE_AUTO_INFO_FIFO); -- append_move(desc, MOVE_WAITCOMP | -- MOVE_SRC_INFIFO | MOVE_DEST_CLASS1CTX | -- (ctx1_iv_off << MOVE_OFFSET_SHIFT) | -- (tfm->ivsize << MOVE_LEN_SHIFT)); -+ append_move(desc, MOVE_SRC_INFIFO | -+ MOVE_DEST_CLASS1CTX | (tfm->ivsize << MOVE_LEN_SHIFT)); - append_cmd(desc, CMD_LOAD | ENABLE_AUTO_INFO_FIFO); - - /* Copy IV to class 1 context */ -- append_move(desc, MOVE_SRC_CLASS1CTX | MOVE_DEST_OUTFIFO | -- (ctx1_iv_off << MOVE_OFFSET_SHIFT) | -- (tfm->ivsize << MOVE_LEN_SHIFT)); -+ append_move(desc, MOVE_SRC_CLASS1CTX | -+ MOVE_DEST_OUTFIFO | (tfm->ivsize << MOVE_LEN_SHIFT)); - - /* Return to encryption */ - append_operation(desc, ctx->class2_alg_type | -@@ -674,7 +406,7 @@ - append_seq_fifo_load(desc, 0, FIFOLD_CLASS_CLASS2 | FIFOLD_TYPE_MSG | - KEY_VLF); - -- /* Copy iv from outfifo to class 2 fifo */ -+ /* Copy iv from class 1 ctx to class 2 fifo*/ - moveiv = NFIFOENTRY_STYPE_OFIFO | NFIFOENTRY_DEST_CLASS2 | - NFIFOENTRY_DTYPE_MSG | (tfm->ivsize << NFIFOENTRY_DLEN_SHIFT); - append_load_imm_u32(desc, moveiv, LDST_CLASS_IND_CCB | -@@ -682,14 +414,6 @@ - append_load_imm_u32(desc, tfm->ivsize, LDST_CLASS_2_CCB | - LDST_SRCDST_WORD_DATASZ_REG | LDST_IMM); - -- /* Load Counter into CONTEXT1 reg */ -- if (is_rfc3686) -- append_load_imm_u32(desc, be32_to_cpu(1), LDST_IMM | -- LDST_CLASS_1_CCB | -- LDST_SRCDST_BYTE_CONTEXT | -- ((ctx1_iv_off + CTR_RFC3686_IV_SIZE) << -- LDST_OFFSET_SHIFT)); -- - /* Class 1 operation */ - append_operation(desc, ctx->class1_alg_type | - OP_ALG_AS_INITFINAL | OP_ALG_ENCRYPT); -@@ -717,10 +441,12 @@ - return -ENOMEM; - } - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "aead givenc shdesc@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "aead givenc shdesc@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, desc, - desc_bytes(desc), 1); - #endif -+ dma_sync_single_for_cpu(jrdev, ctx->sh_desc_givenc_dma, -+ desc_bytes(desc), DMA_TO_DEVICE); - - return 0; - } -@@ -736,977 +462,84 @@ - return 0; - } - --static int gcm_set_sh_desc(struct crypto_aead *aead) -+static u32 gen_split_aead_key(struct caam_ctx *ctx, const u8 *key_in, -+ u32 authkeylen) - { -- struct aead_tfm *tfm = &aead->base.crt_aead; -+ return gen_split_key(ctx->jrdev, ctx->key, ctx->split_key_len, -+ ctx->split_key_pad_len, key_in, authkeylen, -+ ctx->alg_op); -+} -+ -+static int aead_setkey(struct crypto_aead *aead, -+ const u8 *key, unsigned int keylen) -+{ -+ /* Sizes for MDHA pads (*not* keys): MD5, SHA1, 224, 256, 384, 512 */ -+ static const u8 mdpadlen[] = { 16, 20, 32, 32, 64, 64 }; - struct caam_ctx *ctx = crypto_aead_ctx(aead); - struct device *jrdev = ctx->jrdev; -- bool keys_fit_inline = false; -- u32 *key_jump_cmd, *zero_payload_jump_cmd, -- *zero_assoc_jump_cmd1, *zero_assoc_jump_cmd2; -- u32 *desc; -- -- if (!ctx->enckeylen || !ctx->authsize) -- return 0; -- -- /* -- * AES GCM encrypt shared descriptor -- * Job Descriptor and Shared Descriptor -- * must fit into the 64-word Descriptor h/w Buffer -- */ -- if (DESC_GCM_ENC_LEN + DESC_JOB_IO_LEN + -- ctx->enckeylen <= CAAM_DESC_BYTES_MAX) -- keys_fit_inline = true; -+ struct rtattr *rta = (void *)key; -+ struct crypto_authenc_key_param *param; -+ unsigned int authkeylen; -+ 
unsigned int enckeylen; -+ int ret = 0; - -- desc = ctx->sh_desc_enc; -+ param = RTA_DATA(rta); -+ enckeylen = be32_to_cpu(param->enckeylen); - -- init_sh_desc(desc, HDR_SHARE_SERIAL); -+ key += RTA_ALIGN(rta->rta_len); -+ keylen -= RTA_ALIGN(rta->rta_len); - -- /* skip key loading if they are loaded due to sharing */ -- key_jump_cmd = append_jump(desc, JUMP_JSL | JUMP_TEST_ALL | -- JUMP_COND_SHRD | JUMP_COND_SELF); -- if (keys_fit_inline) -- append_key_as_imm(desc, (void *)ctx->key, ctx->enckeylen, -- ctx->enckeylen, CLASS_1 | KEY_DEST_CLASS_REG); -- else -- append_key(desc, ctx->key_dma, ctx->enckeylen, -- CLASS_1 | KEY_DEST_CLASS_REG); -- set_jump_tgt_here(desc, key_jump_cmd); -+ if (keylen < enckeylen) -+ goto badkey; - -- /* class 1 operation */ -- append_operation(desc, ctx->class1_alg_type | -- OP_ALG_AS_INITFINAL | OP_ALG_ENCRYPT); -+ authkeylen = keylen - enckeylen; - -- /* cryptlen = seqoutlen - authsize */ -- append_math_sub_imm_u32(desc, REG3, SEQOUTLEN, IMM, ctx->authsize); -+ if (keylen > CAAM_MAX_KEY_SIZE) -+ goto badkey; - -- /* assoclen + cryptlen = seqinlen - ivsize */ -- append_math_sub_imm_u32(desc, REG2, SEQINLEN, IMM, tfm->ivsize); -+ /* Pick class 2 key length from algorithm submask */ -+ ctx->split_key_len = mdpadlen[(ctx->alg_op & OP_ALG_ALGSEL_SUBMASK) >> -+ OP_ALG_ALGSEL_SHIFT] * 2; -+ ctx->split_key_pad_len = ALIGN(ctx->split_key_len, 16); - -- /* assoclen = (assoclen + cryptlen) - cryptlen */ -- append_math_sub(desc, REG1, REG2, REG3, CAAM_CMD_SZ); -+#ifdef DEBUG -+ printk(KERN_ERR "keylen %d enckeylen %d authkeylen %d\n", -+ keylen, enckeylen, authkeylen); -+ printk(KERN_ERR "split_key_len %d split_key_pad_len %d\n", -+ ctx->split_key_len, ctx->split_key_pad_len); -+ print_hex_dump(KERN_ERR, "key in @"xstr(__LINE__)": ", -+ DUMP_PREFIX_ADDRESS, 16, 4, key, keylen, 1); -+#endif - -- /* if cryptlen is ZERO jump to zero-payload commands */ -- append_math_add(desc, VARSEQOUTLEN, ZERO, REG3, CAAM_CMD_SZ); -- zero_payload_jump_cmd = append_jump(desc, JUMP_TEST_ALL | -- JUMP_COND_MATH_Z); -- /* read IV */ -- append_seq_fifo_load(desc, tfm->ivsize, FIFOLD_CLASS_CLASS1 | -- FIFOLD_TYPE_IV | FIFOLD_TYPE_FLUSH1); -- -- /* if assoclen is ZERO, skip reading the assoc data */ -- append_math_add(desc, VARSEQINLEN, ZERO, REG1, CAAM_CMD_SZ); -- zero_assoc_jump_cmd1 = append_jump(desc, JUMP_TEST_ALL | -- JUMP_COND_MATH_Z); -- -- /* read assoc data */ -- append_seq_fifo_load(desc, 0, FIFOLD_CLASS_CLASS1 | FIFOLDST_VLF | -- FIFOLD_TYPE_AAD | FIFOLD_TYPE_FLUSH1); -- set_jump_tgt_here(desc, zero_assoc_jump_cmd1); -+ ret = gen_split_aead_key(ctx, key, authkeylen); -+ if (ret) { -+ goto badkey; -+ } - -- append_math_add(desc, VARSEQINLEN, ZERO, REG3, CAAM_CMD_SZ); -+ /* postpend encryption key to auth split key */ -+ memcpy(ctx->key + ctx->split_key_pad_len, key + authkeylen, enckeylen); - -- /* write encrypted data */ -- append_seq_fifo_store(desc, 0, FIFOST_TYPE_MESSAGE_DATA | FIFOLDST_VLF); -+ ctx->key_dma = dma_map_single(jrdev, ctx->key, ctx->split_key_pad_len + -+ enckeylen, DMA_TO_DEVICE); -+ if (dma_mapping_error(jrdev, ctx->key_dma)) { -+ dev_err(jrdev, "unable to map key i/o memory\n"); -+ return -ENOMEM; -+ } -+#ifdef DEBUG -+ print_hex_dump(KERN_ERR, "ctx.key@"xstr(__LINE__)": ", -+ DUMP_PREFIX_ADDRESS, 16, 4, ctx->key, -+ ctx->split_key_pad_len + enckeylen, 1); -+#endif -+ dma_sync_single_for_device(jrdev, ctx->key_dma, -+ ctx->split_key_pad_len + enckeylen, -+ DMA_TO_DEVICE); - -- /* read payload data */ -- append_seq_fifo_load(desc, 0, FIFOLD_CLASS_CLASS1 | 
FIFOLDST_VLF | -- FIFOLD_TYPE_MSG | FIFOLD_TYPE_LAST1); -- -- /* jump the zero-payload commands */ -- append_jump(desc, JUMP_TEST_ALL | 7); -- -- /* zero-payload commands */ -- set_jump_tgt_here(desc, zero_payload_jump_cmd); -- -- /* if assoclen is ZERO, jump to IV reading - is the only input data */ -- append_math_add(desc, VARSEQINLEN, ZERO, REG1, CAAM_CMD_SZ); -- zero_assoc_jump_cmd2 = append_jump(desc, JUMP_TEST_ALL | -- JUMP_COND_MATH_Z); -- /* read IV */ -- append_seq_fifo_load(desc, tfm->ivsize, FIFOLD_CLASS_CLASS1 | -- FIFOLD_TYPE_IV | FIFOLD_TYPE_FLUSH1); -- -- /* read assoc data */ -- append_seq_fifo_load(desc, 0, FIFOLD_CLASS_CLASS1 | FIFOLDST_VLF | -- FIFOLD_TYPE_AAD | FIFOLD_TYPE_LAST1); -- -- /* jump to ICV writing */ -- append_jump(desc, JUMP_TEST_ALL | 2); -- -- /* read IV - is the only input data */ -- set_jump_tgt_here(desc, zero_assoc_jump_cmd2); -- append_seq_fifo_load(desc, tfm->ivsize, FIFOLD_CLASS_CLASS1 | -- FIFOLD_TYPE_IV | FIFOLD_TYPE_FLUSH1 | -- FIFOLD_TYPE_LAST1); -- -- /* write ICV */ -- append_seq_store(desc, ctx->authsize, LDST_CLASS_1_CCB | -- LDST_SRCDST_BYTE_CONTEXT); -- -- ctx->sh_desc_enc_dma = dma_map_single(jrdev, desc, -- desc_bytes(desc), -- DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, ctx->sh_desc_enc_dma)) { -- dev_err(jrdev, "unable to map shared descriptor\n"); -- return -ENOMEM; -- } --#ifdef DEBUG -- print_hex_dump(KERN_ERR, "gcm enc shdesc@"__stringify(__LINE__)": ", -- DUMP_PREFIX_ADDRESS, 16, 4, desc, -- desc_bytes(desc), 1); --#endif -- -- /* -- * Job Descriptor and Shared Descriptors -- * must all fit into the 64-word Descriptor h/w Buffer -- */ -- keys_fit_inline = false; -- if (DESC_GCM_DEC_LEN + DESC_JOB_IO_LEN + -- ctx->enckeylen <= CAAM_DESC_BYTES_MAX) -- keys_fit_inline = true; -- -- desc = ctx->sh_desc_dec; -- -- init_sh_desc(desc, HDR_SHARE_SERIAL); -- -- /* skip key loading if they are loaded due to sharing */ -- key_jump_cmd = append_jump(desc, JUMP_JSL | -- JUMP_TEST_ALL | JUMP_COND_SHRD | -- JUMP_COND_SELF); -- if (keys_fit_inline) -- append_key_as_imm(desc, (void *)ctx->key, ctx->enckeylen, -- ctx->enckeylen, CLASS_1 | KEY_DEST_CLASS_REG); -- else -- append_key(desc, ctx->key_dma, ctx->enckeylen, -- CLASS_1 | KEY_DEST_CLASS_REG); -- set_jump_tgt_here(desc, key_jump_cmd); -- -- /* class 1 operation */ -- append_operation(desc, ctx->class1_alg_type | -- OP_ALG_AS_INITFINAL | OP_ALG_DECRYPT | OP_ALG_ICV_ON); -- -- /* assoclen + cryptlen = seqinlen - ivsize - icvsize */ -- append_math_sub_imm_u32(desc, REG3, SEQINLEN, IMM, -- ctx->authsize + tfm->ivsize); -- -- /* assoclen = (assoclen + cryptlen) - cryptlen */ -- append_math_sub(desc, REG2, SEQOUTLEN, REG0, CAAM_CMD_SZ); -- append_math_sub(desc, REG1, REG3, REG2, CAAM_CMD_SZ); -- -- /* read IV */ -- append_seq_fifo_load(desc, tfm->ivsize, FIFOLD_CLASS_CLASS1 | -- FIFOLD_TYPE_IV | FIFOLD_TYPE_FLUSH1); -- -- /* jump to zero-payload command if cryptlen is zero */ -- append_math_add(desc, VARSEQOUTLEN, ZERO, REG2, CAAM_CMD_SZ); -- zero_payload_jump_cmd = append_jump(desc, JUMP_TEST_ALL | -- JUMP_COND_MATH_Z); -- -- append_math_add(desc, VARSEQINLEN, ZERO, REG1, CAAM_CMD_SZ); -- /* if asoclen is ZERO, skip reading assoc data */ -- zero_assoc_jump_cmd1 = append_jump(desc, JUMP_TEST_ALL | -- JUMP_COND_MATH_Z); -- /* read assoc data */ -- append_seq_fifo_load(desc, 0, FIFOLD_CLASS_CLASS1 | FIFOLDST_VLF | -- FIFOLD_TYPE_AAD | FIFOLD_TYPE_FLUSH1); -- set_jump_tgt_here(desc, zero_assoc_jump_cmd1); -- -- append_math_add(desc, VARSEQINLEN, ZERO, REG2, CAAM_CMD_SZ); -- -- /* store encrypted 
data */ -- append_seq_fifo_store(desc, 0, FIFOST_TYPE_MESSAGE_DATA | FIFOLDST_VLF); -- -- /* read payload data */ -- append_seq_fifo_load(desc, 0, FIFOLD_CLASS_CLASS1 | FIFOLDST_VLF | -- FIFOLD_TYPE_MSG | FIFOLD_TYPE_FLUSH1); -- -- /* jump the zero-payload commands */ -- append_jump(desc, JUMP_TEST_ALL | 4); -- -- /* zero-payload command */ -- set_jump_tgt_here(desc, zero_payload_jump_cmd); -- -- /* if assoclen is ZERO, jump to ICV reading */ -- append_math_add(desc, VARSEQINLEN, ZERO, REG1, CAAM_CMD_SZ); -- zero_assoc_jump_cmd2 = append_jump(desc, JUMP_TEST_ALL | -- JUMP_COND_MATH_Z); -- /* read assoc data */ -- append_seq_fifo_load(desc, 0, FIFOLD_CLASS_CLASS1 | FIFOLDST_VLF | -- FIFOLD_TYPE_AAD | FIFOLD_TYPE_FLUSH1); -- set_jump_tgt_here(desc, zero_assoc_jump_cmd2); -- -- /* read ICV */ -- append_seq_fifo_load(desc, ctx->authsize, FIFOLD_CLASS_CLASS1 | -- FIFOLD_TYPE_ICV | FIFOLD_TYPE_LAST1); -- -- ctx->sh_desc_dec_dma = dma_map_single(jrdev, desc, -- desc_bytes(desc), -- DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, ctx->sh_desc_dec_dma)) { -- dev_err(jrdev, "unable to map shared descriptor\n"); -- return -ENOMEM; -- } --#ifdef DEBUG -- print_hex_dump(KERN_ERR, "gcm dec shdesc@"__stringify(__LINE__)": ", -- DUMP_PREFIX_ADDRESS, 16, 4, desc, -- desc_bytes(desc), 1); --#endif -- -- return 0; --} -- --static int gcm_setauthsize(struct crypto_aead *authenc, unsigned int authsize) --{ -- struct caam_ctx *ctx = crypto_aead_ctx(authenc); -- -- ctx->authsize = authsize; -- gcm_set_sh_desc(authenc); -- -- return 0; --} -- --static int rfc4106_set_sh_desc(struct crypto_aead *aead) --{ -- struct aead_tfm *tfm = &aead->base.crt_aead; -- struct caam_ctx *ctx = crypto_aead_ctx(aead); -- struct device *jrdev = ctx->jrdev; -- bool keys_fit_inline = false; -- u32 *key_jump_cmd, *move_cmd, *write_iv_cmd; -- u32 *desc; -- u32 geniv; -- -- if (!ctx->enckeylen || !ctx->authsize) -- return 0; -- -- /* -- * RFC4106 encrypt shared descriptor -- * Job Descriptor and Shared Descriptor -- * must fit into the 64-word Descriptor h/w Buffer -- */ -- if (DESC_RFC4106_ENC_LEN + DESC_JOB_IO_LEN + -- ctx->enckeylen <= CAAM_DESC_BYTES_MAX) -- keys_fit_inline = true; -- -- desc = ctx->sh_desc_enc; -- -- init_sh_desc(desc, HDR_SHARE_SERIAL); -- -- /* Skip key loading if it is loaded due to sharing */ -- key_jump_cmd = append_jump(desc, JUMP_JSL | JUMP_TEST_ALL | -- JUMP_COND_SHRD); -- if (keys_fit_inline) -- append_key_as_imm(desc, (void *)ctx->key, ctx->enckeylen, -- ctx->enckeylen, CLASS_1 | KEY_DEST_CLASS_REG); -- else -- append_key(desc, ctx->key_dma, ctx->enckeylen, -- CLASS_1 | KEY_DEST_CLASS_REG); -- set_jump_tgt_here(desc, key_jump_cmd); -- -- /* Class 1 operation */ -- append_operation(desc, ctx->class1_alg_type | -- OP_ALG_AS_INITFINAL | OP_ALG_ENCRYPT); -- -- /* cryptlen = seqoutlen - authsize */ -- append_math_sub_imm_u32(desc, REG3, SEQOUTLEN, IMM, ctx->authsize); -- append_math_add(desc, VARSEQOUTLEN, ZERO, REG3, CAAM_CMD_SZ); -- -- /* assoclen + cryptlen = seqinlen - ivsize */ -- append_math_sub_imm_u32(desc, REG2, SEQINLEN, IMM, tfm->ivsize); -- -- /* assoclen = (assoclen + cryptlen) - cryptlen */ -- append_math_sub(desc, VARSEQINLEN, REG2, REG3, CAAM_CMD_SZ); -- -- /* Read Salt */ -- append_fifo_load_as_imm(desc, (void *)(ctx->key + ctx->enckeylen), -- 4, FIFOLD_CLASS_CLASS1 | FIFOLD_TYPE_IV); -- /* Read AES-GCM-ESP IV */ -- append_seq_fifo_load(desc, tfm->ivsize, FIFOLD_CLASS_CLASS1 | -- FIFOLD_TYPE_IV | FIFOLD_TYPE_FLUSH1); -- -- /* Read assoc data */ -- append_seq_fifo_load(desc, 0, 
FIFOLD_CLASS_CLASS1 | FIFOLDST_VLF | -- FIFOLD_TYPE_AAD | FIFOLD_TYPE_FLUSH1); -- -- /* Will read cryptlen bytes */ -- append_math_add(desc, VARSEQINLEN, ZERO, REG3, CAAM_CMD_SZ); -- -- /* Write encrypted data */ -- append_seq_fifo_store(desc, 0, FIFOST_TYPE_MESSAGE_DATA | FIFOLDST_VLF); -- -- /* Read payload data */ -- append_seq_fifo_load(desc, 0, FIFOLD_CLASS_CLASS1 | FIFOLDST_VLF | -- FIFOLD_TYPE_MSG | FIFOLD_TYPE_LAST1); -- -- /* Write ICV */ -- append_seq_store(desc, ctx->authsize, LDST_CLASS_1_CCB | -- LDST_SRCDST_BYTE_CONTEXT); -- -- ctx->sh_desc_enc_dma = dma_map_single(jrdev, desc, -- desc_bytes(desc), -- DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, ctx->sh_desc_enc_dma)) { -- dev_err(jrdev, "unable to map shared descriptor\n"); -- return -ENOMEM; -- } --#ifdef DEBUG -- print_hex_dump(KERN_ERR, "rfc4106 enc shdesc@"__stringify(__LINE__)": ", -- DUMP_PREFIX_ADDRESS, 16, 4, desc, -- desc_bytes(desc), 1); --#endif -- -- /* -- * Job Descriptor and Shared Descriptors -- * must all fit into the 64-word Descriptor h/w Buffer -- */ -- keys_fit_inline = false; -- if (DESC_RFC4106_DEC_LEN + DESC_JOB_IO_LEN + -- ctx->enckeylen <= CAAM_DESC_BYTES_MAX) -- keys_fit_inline = true; -- -- desc = ctx->sh_desc_dec; -- -- init_sh_desc(desc, HDR_SHARE_SERIAL); -- -- /* Skip key loading if it is loaded due to sharing */ -- key_jump_cmd = append_jump(desc, JUMP_JSL | -- JUMP_TEST_ALL | JUMP_COND_SHRD); -- if (keys_fit_inline) -- append_key_as_imm(desc, (void *)ctx->key, ctx->enckeylen, -- ctx->enckeylen, CLASS_1 | KEY_DEST_CLASS_REG); -- else -- append_key(desc, ctx->key_dma, ctx->enckeylen, -- CLASS_1 | KEY_DEST_CLASS_REG); -- set_jump_tgt_here(desc, key_jump_cmd); -- -- /* Class 1 operation */ -- append_operation(desc, ctx->class1_alg_type | -- OP_ALG_AS_INITFINAL | OP_ALG_DECRYPT | OP_ALG_ICV_ON); -- -- /* assoclen + cryptlen = seqinlen - ivsize - icvsize */ -- append_math_sub_imm_u32(desc, REG3, SEQINLEN, IMM, -- ctx->authsize + tfm->ivsize); -- -- /* assoclen = (assoclen + cryptlen) - cryptlen */ -- append_math_sub(desc, REG2, SEQOUTLEN, REG0, CAAM_CMD_SZ); -- append_math_sub(desc, VARSEQINLEN, REG3, REG2, CAAM_CMD_SZ); -- -- /* Will write cryptlen bytes */ -- append_math_sub(desc, VARSEQOUTLEN, SEQOUTLEN, REG0, CAAM_CMD_SZ); -- -- /* Read Salt */ -- append_fifo_load_as_imm(desc, (void *)(ctx->key + ctx->enckeylen), -- 4, FIFOLD_CLASS_CLASS1 | FIFOLD_TYPE_IV); -- /* Read AES-GCM-ESP IV */ -- append_seq_fifo_load(desc, tfm->ivsize, FIFOLD_CLASS_CLASS1 | -- FIFOLD_TYPE_IV | FIFOLD_TYPE_FLUSH1); -- -- /* Read assoc data */ -- append_seq_fifo_load(desc, 0, FIFOLD_CLASS_CLASS1 | FIFOLDST_VLF | -- FIFOLD_TYPE_AAD | FIFOLD_TYPE_FLUSH1); -- -- /* Will read cryptlen bytes */ -- append_math_add(desc, VARSEQINLEN, ZERO, REG2, CAAM_CMD_SZ); -- -- /* Store payload data */ -- append_seq_fifo_store(desc, 0, FIFOST_TYPE_MESSAGE_DATA | FIFOLDST_VLF); -- -- /* Read encrypted data */ -- append_seq_fifo_load(desc, 0, FIFOLD_CLASS_CLASS1 | FIFOLDST_VLF | -- FIFOLD_TYPE_MSG | FIFOLD_TYPE_FLUSH1); -- -- /* Read ICV */ -- append_seq_fifo_load(desc, ctx->authsize, FIFOLD_CLASS_CLASS1 | -- FIFOLD_TYPE_ICV | FIFOLD_TYPE_LAST1); -- -- ctx->sh_desc_dec_dma = dma_map_single(jrdev, desc, -- desc_bytes(desc), -- DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, ctx->sh_desc_dec_dma)) { -- dev_err(jrdev, "unable to map shared descriptor\n"); -- return -ENOMEM; -- } --#ifdef DEBUG -- print_hex_dump(KERN_ERR, "rfc4106 dec shdesc@"__stringify(__LINE__)": ", -- DUMP_PREFIX_ADDRESS, 16, 4, desc, -- desc_bytes(desc), 1); --#endif -- 
-- /* -- * Job Descriptor and Shared Descriptors -- * must all fit into the 64-word Descriptor h/w Buffer -- */ -- keys_fit_inline = false; -- if (DESC_RFC4106_GIVENC_LEN + DESC_JOB_IO_LEN + -- ctx->split_key_pad_len + ctx->enckeylen <= -- CAAM_DESC_BYTES_MAX) -- keys_fit_inline = true; -- -- /* rfc4106_givencrypt shared descriptor */ -- desc = ctx->sh_desc_givenc; -- -- init_sh_desc(desc, HDR_SHARE_SERIAL); -- -- /* Skip key loading if it is loaded due to sharing */ -- key_jump_cmd = append_jump(desc, JUMP_JSL | JUMP_TEST_ALL | -- JUMP_COND_SHRD); -- if (keys_fit_inline) -- append_key_as_imm(desc, (void *)ctx->key, ctx->enckeylen, -- ctx->enckeylen, CLASS_1 | KEY_DEST_CLASS_REG); -- else -- append_key(desc, ctx->key_dma, ctx->enckeylen, -- CLASS_1 | KEY_DEST_CLASS_REG); -- set_jump_tgt_here(desc, key_jump_cmd); -- -- /* Generate IV */ -- geniv = NFIFOENTRY_STYPE_PAD | NFIFOENTRY_DEST_DECO | -- NFIFOENTRY_DTYPE_MSG | NFIFOENTRY_LC1 | -- NFIFOENTRY_PTYPE_RND | (tfm->ivsize << NFIFOENTRY_DLEN_SHIFT); -- append_load_imm_u32(desc, geniv, LDST_CLASS_IND_CCB | -- LDST_SRCDST_WORD_INFO_FIFO | LDST_IMM); -- append_cmd(desc, CMD_LOAD | DISABLE_AUTO_INFO_FIFO); -- move_cmd = append_move(desc, MOVE_SRC_INFIFO | MOVE_DEST_DESCBUF | -- (tfm->ivsize << MOVE_LEN_SHIFT)); -- append_cmd(desc, CMD_LOAD | ENABLE_AUTO_INFO_FIFO); -- -- /* Copy generated IV to OFIFO */ -- write_iv_cmd = append_move(desc, MOVE_SRC_DESCBUF | MOVE_DEST_OUTFIFO | -- (tfm->ivsize << MOVE_LEN_SHIFT)); -- -- /* Class 1 operation */ -- append_operation(desc, ctx->class1_alg_type | -- OP_ALG_AS_INITFINAL | OP_ALG_ENCRYPT); -- -- /* ivsize + cryptlen = seqoutlen - authsize */ -- append_math_sub_imm_u32(desc, REG3, SEQOUTLEN, IMM, ctx->authsize); -- -- /* assoclen = seqinlen - (ivsize + cryptlen) */ -- append_math_sub(desc, VARSEQINLEN, SEQINLEN, REG3, CAAM_CMD_SZ); -- -- /* Will write ivsize + cryptlen */ -- append_math_add(desc, VARSEQOUTLEN, REG3, REG0, CAAM_CMD_SZ); -- -- /* Read Salt and generated IV */ -- append_cmd(desc, CMD_FIFO_LOAD | FIFOLD_CLASS_CLASS1 | FIFOLD_TYPE_IV | -- FIFOLD_TYPE_FLUSH1 | IMMEDIATE | 12); -- /* Append Salt */ -- append_data(desc, (void *)(ctx->key + ctx->enckeylen), 4); -- set_move_tgt_here(desc, move_cmd); -- set_move_tgt_here(desc, write_iv_cmd); -- /* Blank commands. Will be overwritten by generated IV. 
*/ -- append_cmd(desc, 0x00000000); -- append_cmd(desc, 0x00000000); -- /* End of blank commands */ -- -- /* No need to reload iv */ -- append_seq_fifo_load(desc, tfm->ivsize, FIFOLD_CLASS_SKIP); -- -- /* Read assoc data */ -- append_seq_fifo_load(desc, 0, FIFOLD_CLASS_CLASS1 | FIFOLDST_VLF | -- FIFOLD_TYPE_AAD | FIFOLD_TYPE_FLUSH1); -- -- /* Will read cryptlen */ -- append_math_add(desc, VARSEQINLEN, SEQINLEN, REG0, CAAM_CMD_SZ); -- -- /* Store generated IV and encrypted data */ -- append_seq_fifo_store(desc, 0, FIFOST_TYPE_MESSAGE_DATA | FIFOLDST_VLF); -- -- /* Read payload data */ -- append_seq_fifo_load(desc, 0, FIFOLD_CLASS_CLASS1 | FIFOLDST_VLF | -- FIFOLD_TYPE_MSG | FIFOLD_TYPE_LAST1); -- -- /* Write ICV */ -- append_seq_store(desc, ctx->authsize, LDST_CLASS_1_CCB | -- LDST_SRCDST_BYTE_CONTEXT); -- -- ctx->sh_desc_givenc_dma = dma_map_single(jrdev, desc, -- desc_bytes(desc), -- DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, ctx->sh_desc_givenc_dma)) { -- dev_err(jrdev, "unable to map shared descriptor\n"); -- return -ENOMEM; -- } --#ifdef DEBUG -- print_hex_dump(KERN_ERR, -- "rfc4106 givenc shdesc@"__stringify(__LINE__)": ", -- DUMP_PREFIX_ADDRESS, 16, 4, desc, -- desc_bytes(desc), 1); --#endif -- -- return 0; --} -- --static int rfc4106_setauthsize(struct crypto_aead *authenc, -- unsigned int authsize) --{ -- struct caam_ctx *ctx = crypto_aead_ctx(authenc); -- -- ctx->authsize = authsize; -- rfc4106_set_sh_desc(authenc); -- -- return 0; --} -- --static int rfc4543_set_sh_desc(struct crypto_aead *aead) --{ -- struct aead_tfm *tfm = &aead->base.crt_aead; -- struct caam_ctx *ctx = crypto_aead_ctx(aead); -- struct device *jrdev = ctx->jrdev; -- bool keys_fit_inline = false; -- u32 *key_jump_cmd, *write_iv_cmd, *write_aad_cmd; -- u32 *read_move_cmd, *write_move_cmd; -- u32 *desc; -- u32 geniv; -- -- if (!ctx->enckeylen || !ctx->authsize) -- return 0; -- -- /* -- * RFC4543 encrypt shared descriptor -- * Job Descriptor and Shared Descriptor -- * must fit into the 64-word Descriptor h/w Buffer -- */ -- if (DESC_RFC4543_ENC_LEN + DESC_JOB_IO_LEN + -- ctx->enckeylen <= CAAM_DESC_BYTES_MAX) -- keys_fit_inline = true; -- -- desc = ctx->sh_desc_enc; -- -- init_sh_desc(desc, HDR_SHARE_SERIAL); -- -- /* Skip key loading if it is loaded due to sharing */ -- key_jump_cmd = append_jump(desc, JUMP_JSL | JUMP_TEST_ALL | -- JUMP_COND_SHRD); -- if (keys_fit_inline) -- append_key_as_imm(desc, (void *)ctx->key, ctx->enckeylen, -- ctx->enckeylen, CLASS_1 | KEY_DEST_CLASS_REG); -- else -- append_key(desc, ctx->key_dma, ctx->enckeylen, -- CLASS_1 | KEY_DEST_CLASS_REG); -- set_jump_tgt_here(desc, key_jump_cmd); -- -- /* Class 1 operation */ -- append_operation(desc, ctx->class1_alg_type | -- OP_ALG_AS_INITFINAL | OP_ALG_ENCRYPT); -- -- /* Load AES-GMAC ESP IV into Math1 register */ -- append_cmd(desc, CMD_SEQ_LOAD | LDST_SRCDST_WORD_DECO_MATH1 | -- LDST_CLASS_DECO | tfm->ivsize); -- -- /* Wait the DMA transaction to finish */ -- append_jump(desc, JUMP_TEST_ALL | JUMP_COND_CALM | -- (1 << JUMP_OFFSET_SHIFT)); -- -- /* Overwrite blank immediate AES-GMAC ESP IV data */ -- write_iv_cmd = append_move(desc, MOVE_SRC_MATH1 | MOVE_DEST_DESCBUF | -- (tfm->ivsize << MOVE_LEN_SHIFT)); -- -- /* Overwrite blank immediate AAD data */ -- write_aad_cmd = append_move(desc, MOVE_SRC_MATH1 | MOVE_DEST_DESCBUF | -- (tfm->ivsize << MOVE_LEN_SHIFT)); -- -- /* cryptlen = seqoutlen - authsize */ -- append_math_sub_imm_u32(desc, REG3, SEQOUTLEN, IMM, ctx->authsize); -- -- /* assoclen = (seqinlen - ivsize) - cryptlen */ -- 
append_math_sub(desc, VARSEQINLEN, SEQINLEN, REG3, CAAM_CMD_SZ); -- -- /* Read Salt and AES-GMAC ESP IV */ -- append_cmd(desc, CMD_FIFO_LOAD | FIFOLD_CLASS_CLASS1 | IMMEDIATE | -- FIFOLD_TYPE_IV | FIFOLD_TYPE_FLUSH1 | (4 + tfm->ivsize)); -- /* Append Salt */ -- append_data(desc, (void *)(ctx->key + ctx->enckeylen), 4); -- set_move_tgt_here(desc, write_iv_cmd); -- /* Blank commands. Will be overwritten by AES-GMAC ESP IV. */ -- append_cmd(desc, 0x00000000); -- append_cmd(desc, 0x00000000); -- /* End of blank commands */ -- -- /* Read assoc data */ -- append_seq_fifo_load(desc, 0, FIFOLD_CLASS_CLASS1 | FIFOLDST_VLF | -- FIFOLD_TYPE_AAD); -- -- /* Will read cryptlen bytes */ -- append_math_add(desc, VARSEQINLEN, ZERO, REG3, CAAM_CMD_SZ); -- -- /* Will write cryptlen bytes */ -- append_math_add(desc, VARSEQOUTLEN, ZERO, REG3, CAAM_CMD_SZ); -- -- /* -- * MOVE_LEN opcode is not available in all SEC HW revisions, -- * thus need to do some magic, i.e. self-patch the descriptor -- * buffer. -- */ -- read_move_cmd = append_move(desc, MOVE_SRC_DESCBUF | MOVE_DEST_MATH3 | -- (0x6 << MOVE_LEN_SHIFT)); -- write_move_cmd = append_move(desc, MOVE_SRC_MATH3 | MOVE_DEST_DESCBUF | -- (0x8 << MOVE_LEN_SHIFT)); -- -- /* Authenticate AES-GMAC ESP IV */ -- append_cmd(desc, CMD_FIFO_LOAD | FIFOLD_CLASS_CLASS1 | IMMEDIATE | -- FIFOLD_TYPE_AAD | tfm->ivsize); -- set_move_tgt_here(desc, write_aad_cmd); -- /* Blank commands. Will be overwritten by AES-GMAC ESP IV. */ -- append_cmd(desc, 0x00000000); -- append_cmd(desc, 0x00000000); -- /* End of blank commands */ -- -- /* Read and write cryptlen bytes */ -- aead_append_src_dst(desc, FIFOLD_TYPE_AAD); -- -- set_move_tgt_here(desc, read_move_cmd); -- set_move_tgt_here(desc, write_move_cmd); -- append_cmd(desc, CMD_LOAD | DISABLE_AUTO_INFO_FIFO); -- /* Move payload data to OFIFO */ -- append_move(desc, MOVE_SRC_INFIFO_CL | MOVE_DEST_OUTFIFO); -- -- /* Write ICV */ -- append_seq_store(desc, ctx->authsize, LDST_CLASS_1_CCB | -- LDST_SRCDST_BYTE_CONTEXT); -- -- ctx->sh_desc_enc_dma = dma_map_single(jrdev, desc, -- desc_bytes(desc), -- DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, ctx->sh_desc_enc_dma)) { -- dev_err(jrdev, "unable to map shared descriptor\n"); -- return -ENOMEM; -- } --#ifdef DEBUG -- print_hex_dump(KERN_ERR, "rfc4543 enc shdesc@"__stringify(__LINE__)": ", -- DUMP_PREFIX_ADDRESS, 16, 4, desc, -- desc_bytes(desc), 1); --#endif -- -- /* -- * Job Descriptor and Shared Descriptors -- * must all fit into the 64-word Descriptor h/w Buffer -- */ -- keys_fit_inline = false; -- if (DESC_RFC4543_DEC_LEN + DESC_JOB_IO_LEN + -- ctx->enckeylen <= CAAM_DESC_BYTES_MAX) -- keys_fit_inline = true; -- -- desc = ctx->sh_desc_dec; -- -- init_sh_desc(desc, HDR_SHARE_SERIAL); -- -- /* Skip key loading if it is loaded due to sharing */ -- key_jump_cmd = append_jump(desc, JUMP_JSL | -- JUMP_TEST_ALL | JUMP_COND_SHRD); -- if (keys_fit_inline) -- append_key_as_imm(desc, (void *)ctx->key, ctx->enckeylen, -- ctx->enckeylen, CLASS_1 | KEY_DEST_CLASS_REG); -- else -- append_key(desc, ctx->key_dma, ctx->enckeylen, -- CLASS_1 | KEY_DEST_CLASS_REG); -- set_jump_tgt_here(desc, key_jump_cmd); -- -- /* Class 1 operation */ -- append_operation(desc, ctx->class1_alg_type | -- OP_ALG_AS_INITFINAL | OP_ALG_DECRYPT | OP_ALG_ICV_ON); -- -- /* Load AES-GMAC ESP IV into Math1 register */ -- append_cmd(desc, CMD_SEQ_LOAD | LDST_SRCDST_WORD_DECO_MATH1 | -- LDST_CLASS_DECO | tfm->ivsize); -- -- /* Wait the DMA transaction to finish */ -- append_jump(desc, JUMP_TEST_ALL | JUMP_COND_CALM | -- (1 << 
JUMP_OFFSET_SHIFT)); -- -- /* assoclen + cryptlen = (seqinlen - ivsize) - icvsize */ -- append_math_sub_imm_u32(desc, REG3, SEQINLEN, IMM, ctx->authsize); -- -- /* Overwrite blank immediate AES-GMAC ESP IV data */ -- write_iv_cmd = append_move(desc, MOVE_SRC_MATH1 | MOVE_DEST_DESCBUF | -- (tfm->ivsize << MOVE_LEN_SHIFT)); -- -- /* Overwrite blank immediate AAD data */ -- write_aad_cmd = append_move(desc, MOVE_SRC_MATH1 | MOVE_DEST_DESCBUF | -- (tfm->ivsize << MOVE_LEN_SHIFT)); -- -- /* assoclen = (assoclen + cryptlen) - cryptlen */ -- append_math_sub(desc, REG2, SEQOUTLEN, REG0, CAAM_CMD_SZ); -- append_math_sub(desc, VARSEQINLEN, REG3, REG2, CAAM_CMD_SZ); -- -- /* -- * MOVE_LEN opcode is not available in all SEC HW revisions, -- * thus need to do some magic, i.e. self-patch the descriptor -- * buffer. -- */ -- read_move_cmd = append_move(desc, MOVE_SRC_DESCBUF | MOVE_DEST_MATH3 | -- (0x6 << MOVE_LEN_SHIFT)); -- write_move_cmd = append_move(desc, MOVE_SRC_MATH3 | MOVE_DEST_DESCBUF | -- (0x8 << MOVE_LEN_SHIFT)); -- -- /* Read Salt and AES-GMAC ESP IV */ -- append_cmd(desc, CMD_FIFO_LOAD | FIFOLD_CLASS_CLASS1 | IMMEDIATE | -- FIFOLD_TYPE_IV | FIFOLD_TYPE_FLUSH1 | (4 + tfm->ivsize)); -- /* Append Salt */ -- append_data(desc, (void *)(ctx->key + ctx->enckeylen), 4); -- set_move_tgt_here(desc, write_iv_cmd); -- /* Blank commands. Will be overwritten by AES-GMAC ESP IV. */ -- append_cmd(desc, 0x00000000); -- append_cmd(desc, 0x00000000); -- /* End of blank commands */ -- -- /* Read assoc data */ -- append_seq_fifo_load(desc, 0, FIFOLD_CLASS_CLASS1 | FIFOLDST_VLF | -- FIFOLD_TYPE_AAD); -- -- /* Will read cryptlen bytes */ -- append_math_add(desc, VARSEQINLEN, ZERO, REG2, CAAM_CMD_SZ); -- -- /* Will write cryptlen bytes */ -- append_math_add(desc, VARSEQOUTLEN, ZERO, REG2, CAAM_CMD_SZ); -- -- /* Authenticate AES-GMAC ESP IV */ -- append_cmd(desc, CMD_FIFO_LOAD | FIFOLD_CLASS_CLASS1 | IMMEDIATE | -- FIFOLD_TYPE_AAD | tfm->ivsize); -- set_move_tgt_here(desc, write_aad_cmd); -- /* Blank commands. Will be overwritten by AES-GMAC ESP IV. 
*/ -- append_cmd(desc, 0x00000000); -- append_cmd(desc, 0x00000000); -- /* End of blank commands */ -- -- /* Store payload data */ -- append_seq_fifo_store(desc, 0, FIFOST_TYPE_MESSAGE_DATA | FIFOLDST_VLF); -- -- /* In-snoop cryptlen data */ -- append_seq_fifo_load(desc, 0, FIFOLD_CLASS_BOTH | FIFOLDST_VLF | -- FIFOLD_TYPE_AAD | FIFOLD_TYPE_LAST2FLUSH1); -- -- set_move_tgt_here(desc, read_move_cmd); -- set_move_tgt_here(desc, write_move_cmd); -- append_cmd(desc, CMD_LOAD | DISABLE_AUTO_INFO_FIFO); -- /* Move payload data to OFIFO */ -- append_move(desc, MOVE_SRC_INFIFO_CL | MOVE_DEST_OUTFIFO); -- append_cmd(desc, CMD_LOAD | ENABLE_AUTO_INFO_FIFO); -- -- /* Read ICV */ -- append_seq_fifo_load(desc, ctx->authsize, FIFOLD_CLASS_CLASS1 | -- FIFOLD_TYPE_ICV | FIFOLD_TYPE_LAST1); -- -- ctx->sh_desc_dec_dma = dma_map_single(jrdev, desc, -- desc_bytes(desc), -- DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, ctx->sh_desc_dec_dma)) { -- dev_err(jrdev, "unable to map shared descriptor\n"); -- return -ENOMEM; -- } --#ifdef DEBUG -- print_hex_dump(KERN_ERR, "rfc4543 dec shdesc@"__stringify(__LINE__)": ", -- DUMP_PREFIX_ADDRESS, 16, 4, desc, -- desc_bytes(desc), 1); --#endif -- -- /* -- * Job Descriptor and Shared Descriptors -- * must all fit into the 64-word Descriptor h/w Buffer -- */ -- keys_fit_inline = false; -- if (DESC_RFC4543_GIVENC_LEN + DESC_JOB_IO_LEN + -- ctx->enckeylen <= CAAM_DESC_BYTES_MAX) -- keys_fit_inline = true; -- -- /* rfc4543_givencrypt shared descriptor */ -- desc = ctx->sh_desc_givenc; -- -- init_sh_desc(desc, HDR_SHARE_SERIAL); -- -- /* Skip key loading if it is loaded due to sharing */ -- key_jump_cmd = append_jump(desc, JUMP_JSL | JUMP_TEST_ALL | -- JUMP_COND_SHRD); -- if (keys_fit_inline) -- append_key_as_imm(desc, (void *)ctx->key, ctx->enckeylen, -- ctx->enckeylen, CLASS_1 | KEY_DEST_CLASS_REG); -- else -- append_key(desc, ctx->key_dma, ctx->enckeylen, -- CLASS_1 | KEY_DEST_CLASS_REG); -- set_jump_tgt_here(desc, key_jump_cmd); -- -- /* Generate IV */ -- geniv = NFIFOENTRY_STYPE_PAD | NFIFOENTRY_DEST_DECO | -- NFIFOENTRY_DTYPE_MSG | NFIFOENTRY_LC1 | -- NFIFOENTRY_PTYPE_RND | (tfm->ivsize << NFIFOENTRY_DLEN_SHIFT); -- append_load_imm_u32(desc, geniv, LDST_CLASS_IND_CCB | -- LDST_SRCDST_WORD_INFO_FIFO | LDST_IMM); -- append_cmd(desc, CMD_LOAD | DISABLE_AUTO_INFO_FIFO); -- /* Move generated IV to Math1 register */ -- append_move(desc, MOVE_SRC_INFIFO | MOVE_DEST_MATH1 | -- (tfm->ivsize << MOVE_LEN_SHIFT)); -- append_cmd(desc, CMD_LOAD | ENABLE_AUTO_INFO_FIFO); -- -- /* Overwrite blank immediate AES-GMAC IV data */ -- write_iv_cmd = append_move(desc, MOVE_SRC_MATH1 | MOVE_DEST_DESCBUF | -- (tfm->ivsize << MOVE_LEN_SHIFT)); -- -- /* Overwrite blank immediate AAD data */ -- write_aad_cmd = append_move(desc, MOVE_SRC_MATH1 | MOVE_DEST_DESCBUF | -- (tfm->ivsize << MOVE_LEN_SHIFT)); -- -- /* Copy generated IV to OFIFO */ -- append_move(desc, MOVE_SRC_MATH1 | MOVE_DEST_OUTFIFO | -- (tfm->ivsize << MOVE_LEN_SHIFT)); -- -- /* Class 1 operation */ -- append_operation(desc, ctx->class1_alg_type | -- OP_ALG_AS_INITFINAL | OP_ALG_ENCRYPT); -- -- /* ivsize + cryptlen = seqoutlen - authsize */ -- append_math_sub_imm_u32(desc, REG3, SEQOUTLEN, IMM, ctx->authsize); -- -- /* assoclen = seqinlen - (ivsize + cryptlen) */ -- append_math_sub(desc, VARSEQINLEN, SEQINLEN, REG3, CAAM_CMD_SZ); -- -- /* Will write ivsize + cryptlen */ -- append_math_add(desc, VARSEQOUTLEN, REG3, REG0, CAAM_CMD_SZ); -- -- /* -- * MOVE_LEN opcode is not available in all SEC HW revisions, -- * thus need to do some magic, 
i.e. self-patch the descriptor -- * buffer. -- */ -- read_move_cmd = append_move(desc, MOVE_SRC_DESCBUF | MOVE_DEST_MATH3 | -- (0x6 << MOVE_LEN_SHIFT)); -- write_move_cmd = append_move(desc, MOVE_SRC_MATH3 | MOVE_DEST_DESCBUF | -- (0x8 << MOVE_LEN_SHIFT)); -- -- /* Read Salt and AES-GMAC generated IV */ -- append_cmd(desc, CMD_FIFO_LOAD | FIFOLD_CLASS_CLASS1 | IMMEDIATE | -- FIFOLD_TYPE_IV | FIFOLD_TYPE_FLUSH1 | (4 + tfm->ivsize)); -- /* Append Salt */ -- append_data(desc, (void *)(ctx->key + ctx->enckeylen), 4); -- set_move_tgt_here(desc, write_iv_cmd); -- /* Blank commands. Will be overwritten by AES-GMAC generated IV. */ -- append_cmd(desc, 0x00000000); -- append_cmd(desc, 0x00000000); -- /* End of blank commands */ -- -- /* No need to reload iv */ -- append_seq_fifo_load(desc, tfm->ivsize, FIFOLD_CLASS_SKIP); -- -- /* Read assoc data */ -- append_seq_fifo_load(desc, 0, FIFOLD_CLASS_CLASS1 | FIFOLDST_VLF | -- FIFOLD_TYPE_AAD); -- -- /* Will read cryptlen */ -- append_math_add(desc, VARSEQINLEN, SEQINLEN, REG0, CAAM_CMD_SZ); -- -- /* Authenticate AES-GMAC IV */ -- append_cmd(desc, CMD_FIFO_LOAD | FIFOLD_CLASS_CLASS1 | IMMEDIATE | -- FIFOLD_TYPE_AAD | tfm->ivsize); -- set_move_tgt_here(desc, write_aad_cmd); -- /* Blank commands. Will be overwritten by AES-GMAC IV. */ -- append_cmd(desc, 0x00000000); -- append_cmd(desc, 0x00000000); -- /* End of blank commands */ -- -- /* Read and write cryptlen bytes */ -- aead_append_src_dst(desc, FIFOLD_TYPE_AAD); -- -- set_move_tgt_here(desc, read_move_cmd); -- set_move_tgt_here(desc, write_move_cmd); -- append_cmd(desc, CMD_LOAD | DISABLE_AUTO_INFO_FIFO); -- /* Move payload data to OFIFO */ -- append_move(desc, MOVE_SRC_INFIFO_CL | MOVE_DEST_OUTFIFO); -- -- /* Write ICV */ -- append_seq_store(desc, ctx->authsize, LDST_CLASS_1_CCB | -- LDST_SRCDST_BYTE_CONTEXT); -- -- ctx->sh_desc_givenc_dma = dma_map_single(jrdev, desc, -- desc_bytes(desc), -- DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, ctx->sh_desc_givenc_dma)) { -- dev_err(jrdev, "unable to map shared descriptor\n"); -- return -ENOMEM; -- } --#ifdef DEBUG -- print_hex_dump(KERN_ERR, -- "rfc4543 givenc shdesc@"__stringify(__LINE__)": ", -- DUMP_PREFIX_ADDRESS, 16, 4, desc, -- desc_bytes(desc), 1); --#endif -- -- return 0; --} -- --static int rfc4543_setauthsize(struct crypto_aead *authenc, -- unsigned int authsize) --{ -- struct caam_ctx *ctx = crypto_aead_ctx(authenc); -- -- ctx->authsize = authsize; -- rfc4543_set_sh_desc(authenc); -- -- return 0; --} -- --static u32 gen_split_aead_key(struct caam_ctx *ctx, const u8 *key_in, -- u32 authkeylen) --{ -- return gen_split_key(ctx->jrdev, ctx->key, ctx->split_key_len, -- ctx->split_key_pad_len, key_in, authkeylen, -- ctx->alg_op); --} -- --static int aead_setkey(struct crypto_aead *aead, -- const u8 *key, unsigned int keylen) --{ -- /* Sizes for MDHA pads (*not* keys): MD5, SHA1, 224, 256, 384, 512 */ -- static const u8 mdpadlen[] = { 16, 20, 32, 32, 64, 64 }; -- struct caam_ctx *ctx = crypto_aead_ctx(aead); -- struct device *jrdev = ctx->jrdev; -- struct crypto_authenc_keys keys; -- int ret = 0; -- -- if (crypto_authenc_extractkeys(&keys, key, keylen) != 0) -- goto badkey; -- -- /* Pick class 2 key length from algorithm submask */ -- ctx->split_key_len = mdpadlen[(ctx->alg_op & OP_ALG_ALGSEL_SUBMASK) >> -- OP_ALG_ALGSEL_SHIFT] * 2; -- ctx->split_key_pad_len = ALIGN(ctx->split_key_len, 16); -- -- if (ctx->split_key_pad_len + keys.enckeylen > CAAM_MAX_KEY_SIZE) -- goto badkey; -- --#ifdef DEBUG -- printk(KERN_ERR "keylen %d enckeylen %d authkeylen 
%d\n", -- keys.authkeylen + keys.enckeylen, keys.enckeylen, -- keys.authkeylen); -- printk(KERN_ERR "split_key_len %d split_key_pad_len %d\n", -- ctx->split_key_len, ctx->split_key_pad_len); -- print_hex_dump(KERN_ERR, "key in @"__stringify(__LINE__)": ", -- DUMP_PREFIX_ADDRESS, 16, 4, key, keylen, 1); --#endif -- -- ret = gen_split_aead_key(ctx, keys.authkey, keys.authkeylen); -- if (ret) { -- goto badkey; -- } -- -- /* postpend encryption key to auth split key */ -- memcpy(ctx->key + ctx->split_key_pad_len, keys.enckey, keys.enckeylen); -- -- ctx->key_dma = dma_map_single(jrdev, ctx->key, ctx->split_key_pad_len + -- keys.enckeylen, DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, ctx->key_dma)) { -- dev_err(jrdev, "unable to map key i/o memory\n"); -- return -ENOMEM; -- } --#ifdef DEBUG -- print_hex_dump(KERN_ERR, "ctx.key@"__stringify(__LINE__)": ", -- DUMP_PREFIX_ADDRESS, 16, 4, ctx->key, -- ctx->split_key_pad_len + keys.enckeylen, 1); --#endif -- -- ctx->enckeylen = keys.enckeylen; -+ ctx->enckeylen = enckeylen; - - ret = aead_set_sh_desc(aead); - if (ret) { - dma_unmap_single(jrdev, ctx->key_dma, ctx->split_key_pad_len + -- keys.enckeylen, DMA_TO_DEVICE); -+ enckeylen, DMA_TO_DEVICE); - } - - return ret; -@@ -1715,154 +548,20 @@ - return -EINVAL; - } - --static int gcm_setkey(struct crypto_aead *aead, -- const u8 *key, unsigned int keylen) --{ -- struct caam_ctx *ctx = crypto_aead_ctx(aead); -- struct device *jrdev = ctx->jrdev; -- int ret = 0; -- --#ifdef DEBUG -- print_hex_dump(KERN_ERR, "key in @"__stringify(__LINE__)": ", -- DUMP_PREFIX_ADDRESS, 16, 4, key, keylen, 1); --#endif -- -- memcpy(ctx->key, key, keylen); -- ctx->key_dma = dma_map_single(jrdev, ctx->key, keylen, -- DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, ctx->key_dma)) { -- dev_err(jrdev, "unable to map key i/o memory\n"); -- return -ENOMEM; -- } -- ctx->enckeylen = keylen; -- -- ret = gcm_set_sh_desc(aead); -- if (ret) { -- dma_unmap_single(jrdev, ctx->key_dma, ctx->enckeylen, -- DMA_TO_DEVICE); -- } -- -- return ret; --} -- --static int rfc4106_setkey(struct crypto_aead *aead, -- const u8 *key, unsigned int keylen) --{ -- struct caam_ctx *ctx = crypto_aead_ctx(aead); -- struct device *jrdev = ctx->jrdev; -- int ret = 0; -- -- if (keylen < 4) -- return -EINVAL; -- --#ifdef DEBUG -- print_hex_dump(KERN_ERR, "key in @"__stringify(__LINE__)": ", -- DUMP_PREFIX_ADDRESS, 16, 4, key, keylen, 1); --#endif -- -- memcpy(ctx->key, key, keylen); -- -- /* -- * The last four bytes of the key material are used as the salt value -- * in the nonce. Update the AES key length. -- */ -- ctx->enckeylen = keylen - 4; -- -- ctx->key_dma = dma_map_single(jrdev, ctx->key, ctx->enckeylen, -- DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, ctx->key_dma)) { -- dev_err(jrdev, "unable to map key i/o memory\n"); -- return -ENOMEM; -- } -- -- ret = rfc4106_set_sh_desc(aead); -- if (ret) { -- dma_unmap_single(jrdev, ctx->key_dma, ctx->enckeylen, -- DMA_TO_DEVICE); -- } -- -- return ret; --} -- --static int rfc4543_setkey(struct crypto_aead *aead, -- const u8 *key, unsigned int keylen) --{ -- struct caam_ctx *ctx = crypto_aead_ctx(aead); -- struct device *jrdev = ctx->jrdev; -- int ret = 0; -- -- if (keylen < 4) -- return -EINVAL; -- --#ifdef DEBUG -- print_hex_dump(KERN_ERR, "key in @"__stringify(__LINE__)": ", -- DUMP_PREFIX_ADDRESS, 16, 4, key, keylen, 1); --#endif -- -- memcpy(ctx->key, key, keylen); -- -- /* -- * The last four bytes of the key material are used as the salt value -- * in the nonce. Update the AES key length. 
-- */ -- ctx->enckeylen = keylen - 4; -- -- ctx->key_dma = dma_map_single(jrdev, ctx->key, ctx->enckeylen, -- DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, ctx->key_dma)) { -- dev_err(jrdev, "unable to map key i/o memory\n"); -- return -ENOMEM; -- } -- -- ret = rfc4543_set_sh_desc(aead); -- if (ret) { -- dma_unmap_single(jrdev, ctx->key_dma, ctx->enckeylen, -- DMA_TO_DEVICE); -- } -- -- return ret; --} -- - static int ablkcipher_setkey(struct crypto_ablkcipher *ablkcipher, - const u8 *key, unsigned int keylen) - { - struct caam_ctx *ctx = crypto_ablkcipher_ctx(ablkcipher); -- struct ablkcipher_tfm *crt = &ablkcipher->base.crt_ablkcipher; -- struct crypto_tfm *tfm = crypto_ablkcipher_tfm(ablkcipher); -- const char *alg_name = crypto_tfm_alg_name(tfm); -+ struct ablkcipher_tfm *tfm = &ablkcipher->base.crt_ablkcipher; - struct device *jrdev = ctx->jrdev; - int ret = 0; -- u32 *key_jump_cmd; -+ u32 *key_jump_cmd, *jump_cmd; - u32 *desc; -- u32 *nonce; -- u32 geniv; -- u32 ctx1_iv_off = 0; -- const bool ctr_mode = ((ctx->class1_alg_type & OP_ALG_AAI_MASK) == -- OP_ALG_AAI_CTR_MOD128); -- const bool is_rfc3686 = (ctr_mode && -- (strstr(alg_name, "rfc3686") != NULL)); - - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "key in @"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "key in @"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, key, keylen, 1); - #endif -- /* -- * AES-CTR needs to load IV in CONTEXT1 reg -- * at an offset of 128bits (16bytes) -- * CONTEXT1[255:128] = IV -- */ -- if (ctr_mode) -- ctx1_iv_off = 16; -- -- /* -- * RFC3686 specific: -- * | CONTEXT1[255:128] = {NONCE, IV, COUNTER} -- * | *key = {KEY, NONCE} -- */ -- if (is_rfc3686) { -- ctx1_iv_off = 16 + CTR_RFC3686_NONCE_SIZE; -- keylen -= CTR_RFC3686_NONCE_SIZE; -- } - - memcpy(ctx->key, key, keylen); - ctx->key_dma = dma_map_single(jrdev, ctx->key, keylen, -@@ -1872,10 +571,11 @@ - return -ENOMEM; - } - ctx->enckeylen = keylen; -+ dma_sync_single_for_device(jrdev, ctx->key_dma, keylen, DMA_TO_DEVICE); - - /* ablkcipher_encrypt shared descriptor */ - desc = ctx->sh_desc_enc; -- init_sh_desc(desc, HDR_SHARE_SERIAL | HDR_SAVECTX); -+ init_sh_desc(desc, HDR_SHARE_SERIAL); - /* Skip if already shared */ - key_jump_cmd = append_jump(desc, JUMP_JSL | JUMP_TEST_ALL | - JUMP_COND_SHRD); -@@ -1885,32 +585,20 @@ - ctx->enckeylen, CLASS_1 | - KEY_DEST_CLASS_REG); - -- /* Load nonce into CONTEXT1 reg */ -- if (is_rfc3686) { -- nonce = (u32 *)(key + keylen); -- append_load_imm_u32(desc, *nonce, LDST_CLASS_IND_CCB | -- LDST_SRCDST_BYTE_OUTFIFO | LDST_IMM); -- append_move(desc, MOVE_WAITCOMP | -- MOVE_SRC_OUTFIFO | -- MOVE_DEST_CLASS1CTX | -- (16 << MOVE_OFFSET_SHIFT) | -- (CTR_RFC3686_NONCE_SIZE << MOVE_LEN_SHIFT)); -- } -- - set_jump_tgt_here(desc, key_jump_cmd); - -- /* Load iv */ -- append_seq_load(desc, crt->ivsize, LDST_SRCDST_BYTE_CONTEXT | -- LDST_CLASS_1_CCB | (ctx1_iv_off << LDST_OFFSET_SHIFT)); -- -- /* Load counter into CONTEXT1 reg */ -- if (is_rfc3686) -- append_load_imm_u32(desc, be32_to_cpu(1), LDST_IMM | -- LDST_CLASS_1_CCB | -- LDST_SRCDST_BYTE_CONTEXT | -- ((ctx1_iv_off + CTR_RFC3686_IV_SIZE) << -- LDST_OFFSET_SHIFT)); -+ /* Propagate errors from shared to job descriptor */ -+ append_cmd(desc, SET_OK_NO_PROP_ERRORS | CMD_LOAD); - -+ /* load IV */ -+ if (strncmp(ablkcipher->base.__crt_alg->cra_name, "ctr(aes)", 8) == 0) { -+ append_cmd(desc, CMD_SEQ_LOAD | LDST_SRCDST_BYTE_CONTEXT | -+ LDST_CLASS_1_CCB | tfm->ivsize | -+ (16 << LDST_OFFSET_SHIFT)); -+ } else { -+ append_cmd(desc, CMD_SEQ_LOAD | LDST_SRCDST_BYTE_CONTEXT | 
-+ LDST_CLASS_1_CCB | tfm->ivsize); -+ } - /* Load operation */ - append_operation(desc, ctx->class1_alg_type | - OP_ALG_AS_INITFINAL | OP_ALG_ENCRYPT); -@@ -1926,15 +614,17 @@ - return -ENOMEM; - } - #ifdef DEBUG -- print_hex_dump(KERN_ERR, -- "ablkcipher enc shdesc@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "ablkcipher enc shdesc@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, desc, - desc_bytes(desc), 1); - #endif -+ dma_sync_single_for_device(jrdev, ctx->sh_desc_enc_dma, -+ desc_bytes(desc), DMA_TO_DEVICE); -+ - /* ablkcipher_decrypt shared descriptor */ - desc = ctx->sh_desc_dec; - -- init_sh_desc(desc, HDR_SHARE_SERIAL | HDR_SAVECTX); -+ init_sh_desc(desc, HDR_SHARE_SERIAL); - /* Skip if already shared */ - key_jump_cmd = append_jump(desc, JUMP_JSL | JUMP_TEST_ALL | - JUMP_COND_SHRD); -@@ -1944,133 +634,49 @@ - ctx->enckeylen, CLASS_1 | - KEY_DEST_CLASS_REG); - -- /* Load nonce into CONTEXT1 reg */ -- if (is_rfc3686) { -- nonce = (u32 *)(key + keylen); -- append_load_imm_u32(desc, *nonce, LDST_CLASS_IND_CCB | -- LDST_SRCDST_BYTE_OUTFIFO | LDST_IMM); -- append_move(desc, MOVE_WAITCOMP | -- MOVE_SRC_OUTFIFO | -- MOVE_DEST_CLASS1CTX | -- (16 << MOVE_OFFSET_SHIFT) | -- (CTR_RFC3686_NONCE_SIZE << MOVE_LEN_SHIFT)); -- } -- -+ /* For aead, only propagate error immediately if shared */ -+ jump_cmd = append_jump(desc, JUMP_TEST_ALL); - set_jump_tgt_here(desc, key_jump_cmd); -+ append_cmd(desc, SET_OK_NO_PROP_ERRORS | CMD_LOAD); -+ set_jump_tgt_here(desc, jump_cmd); - - /* load IV */ -- append_seq_load(desc, crt->ivsize, LDST_SRCDST_BYTE_CONTEXT | -- LDST_CLASS_1_CCB | (ctx1_iv_off << LDST_OFFSET_SHIFT)); -- -- /* Load counter into CONTEXT1 reg */ -- if (is_rfc3686) -- append_load_imm_u32(desc, be32_to_cpu(1), LDST_IMM | -- LDST_CLASS_1_CCB | -- LDST_SRCDST_BYTE_CONTEXT | -- ((ctx1_iv_off + CTR_RFC3686_IV_SIZE) << -- LDST_OFFSET_SHIFT)); -+ if (strncmp(ablkcipher->base.__crt_alg->cra_name, "ctr(aes)", 8) == 0) { -+ append_cmd(desc, CMD_SEQ_LOAD | LDST_SRCDST_BYTE_CONTEXT | -+ LDST_CLASS_1_CCB | tfm->ivsize | -+ (16 << LDST_OFFSET_SHIFT)); - -- /* Choose operation */ -- if (ctr_mode) - append_operation(desc, ctx->class1_alg_type | -- OP_ALG_AS_INITFINAL | OP_ALG_DECRYPT); -- else -+ OP_ALG_AS_INITFINAL | OP_ALG_DECRYPT); -+ } else { -+ append_cmd(desc, CMD_SEQ_LOAD | LDST_SRCDST_BYTE_CONTEXT | -+ LDST_CLASS_1_CCB | tfm->ivsize); -+ -+ /* Choose operation */ - append_dec_op1(desc, ctx->class1_alg_type); -+ } - - /* Perform operation */ - ablkcipher_append_src_dst(desc); - -+ /* Wait for key to load before allowing propagating error */ -+ append_dec_shr_done(desc); -+ - ctx->sh_desc_dec_dma = dma_map_single(jrdev, desc, - desc_bytes(desc), - DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, ctx->sh_desc_dec_dma)) { -+ if (dma_mapping_error(jrdev, ctx->sh_desc_enc_dma)) { - dev_err(jrdev, "unable to map shared descriptor\n"); - return -ENOMEM; - } - - #ifdef DEBUG -- print_hex_dump(KERN_ERR, -- "ablkcipher dec shdesc@"__stringify(__LINE__)": ", -- DUMP_PREFIX_ADDRESS, 16, 4, desc, -- desc_bytes(desc), 1); --#endif -- /* ablkcipher_givencrypt shared descriptor */ -- desc = ctx->sh_desc_givenc; -- -- init_sh_desc(desc, HDR_SHARE_SERIAL | HDR_SAVECTX); -- /* Skip if already shared */ -- key_jump_cmd = append_jump(desc, JUMP_JSL | JUMP_TEST_ALL | -- JUMP_COND_SHRD); -- -- /* Load class1 key only */ -- append_key_as_imm(desc, (void *)ctx->key, ctx->enckeylen, -- ctx->enckeylen, CLASS_1 | -- KEY_DEST_CLASS_REG); -- -- /* Load Nonce into CONTEXT1 reg */ -- if (is_rfc3686) { -- nonce = (u32 
*)(key + keylen); -- append_load_imm_u32(desc, *nonce, LDST_CLASS_IND_CCB | -- LDST_SRCDST_BYTE_OUTFIFO | LDST_IMM); -- append_move(desc, MOVE_WAITCOMP | -- MOVE_SRC_OUTFIFO | -- MOVE_DEST_CLASS1CTX | -- (16 << MOVE_OFFSET_SHIFT) | -- (CTR_RFC3686_NONCE_SIZE << MOVE_LEN_SHIFT)); -- } -- set_jump_tgt_here(desc, key_jump_cmd); -- -- /* Generate IV */ -- geniv = NFIFOENTRY_STYPE_PAD | NFIFOENTRY_DEST_DECO | -- NFIFOENTRY_DTYPE_MSG | NFIFOENTRY_LC1 | -- NFIFOENTRY_PTYPE_RND | (crt->ivsize << NFIFOENTRY_DLEN_SHIFT); -- append_load_imm_u32(desc, geniv, LDST_CLASS_IND_CCB | -- LDST_SRCDST_WORD_INFO_FIFO | LDST_IMM); -- append_cmd(desc, CMD_LOAD | DISABLE_AUTO_INFO_FIFO); -- append_move(desc, MOVE_WAITCOMP | -- MOVE_SRC_INFIFO | -- MOVE_DEST_CLASS1CTX | -- (crt->ivsize << MOVE_LEN_SHIFT) | -- (ctx1_iv_off << MOVE_OFFSET_SHIFT)); -- append_cmd(desc, CMD_LOAD | ENABLE_AUTO_INFO_FIFO); -- -- /* Copy generated IV to memory */ -- append_seq_store(desc, crt->ivsize, -- LDST_SRCDST_BYTE_CONTEXT | LDST_CLASS_1_CCB | -- (ctx1_iv_off << LDST_OFFSET_SHIFT)); -- -- /* Load Counter into CONTEXT1 reg */ -- if (is_rfc3686) -- append_load_imm_u32(desc, (u32)1, LDST_IMM | -- LDST_CLASS_1_CCB | -- LDST_SRCDST_BYTE_CONTEXT | -- ((ctx1_iv_off + CTR_RFC3686_IV_SIZE) << -- LDST_OFFSET_SHIFT)); -- -- if (ctx1_iv_off) -- append_jump(desc, JUMP_JSL | JUMP_TEST_ALL | JUMP_COND_NCP | -- (1 << JUMP_OFFSET_SHIFT)); -- -- /* Load operation */ -- append_operation(desc, ctx->class1_alg_type | -- OP_ALG_AS_INITFINAL | OP_ALG_ENCRYPT); -- -- /* Perform operation */ -- ablkcipher_append_src_dst(desc); -- -- ctx->sh_desc_givenc_dma = dma_map_single(jrdev, desc, -- desc_bytes(desc), -- DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, ctx->sh_desc_givenc_dma)) { -- dev_err(jrdev, "unable to map shared descriptor\n"); -- return -ENOMEM; -- } --#ifdef DEBUG -- print_hex_dump(KERN_ERR, -- "ablkcipher givenc shdesc@" __stringify(__LINE__) ": ", -+ print_hex_dump(KERN_ERR, "ablkcipher dec shdesc@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, desc, - desc_bytes(desc), 1); - #endif -+ dma_sync_single_for_device(jrdev, ctx->sh_desc_dec_dma, -+ desc_bytes(desc), DMA_TO_DEVICE); - - return ret; - } -@@ -2195,19 +801,22 @@ - edesc = (struct aead_edesc *)((char *)desc - - offsetof(struct aead_edesc, hw_desc)); - -- if (err) -- caam_jr_strstatus(jrdev, err); -+ if (err) { -+ char tmp[CAAM_ERROR_STR_MAX]; -+ -+ dev_err(jrdev, "%08x: %s\n", err, caam_jr_strstatus(tmp, err)); -+ } - - aead_unmap(jrdev, edesc, req); - - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "assoc @"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "assoc @"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, sg_virt(req->assoc), - req->assoclen , 1); -- print_hex_dump(KERN_ERR, "dstiv @"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "dstiv @"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, sg_virt(req->src) - ivsize, - edesc->src_nents ? 100 : ivsize, 1); -- print_hex_dump(KERN_ERR, "dst @"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "dst @"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, sg_virt(req->src), - edesc->src_nents ? 
100 : req->cryptlen + - ctx->authsize + 4, 1); -@@ -2235,16 +844,19 @@ - offsetof(struct aead_edesc, hw_desc)); - - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "dstiv @"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "dstiv @"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, req->iv, - ivsize, 1); -- print_hex_dump(KERN_ERR, "dst @"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "dst @"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, sg_virt(req->dst), -- req->cryptlen - ctx->authsize, 1); -+ req->cryptlen, 1); - #endif - -- if (err) -- caam_jr_strstatus(jrdev, err); -+ if (err) { -+ char tmp[CAAM_ERROR_STR_MAX]; -+ -+ dev_err(jrdev, "%08x: %s\n", err, caam_jr_strstatus(tmp, err)); -+ } - - aead_unmap(jrdev, edesc, req); - -@@ -2255,7 +867,7 @@ - err = -EBADMSG; - - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "iphdrout@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "iphdrout@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, - ((char *)sg_virt(req->assoc) - sizeof(struct iphdr)), - sizeof(struct iphdr) + req->assoclen + -@@ -2263,7 +875,7 @@ - ctx->authsize + 36, 1); - if (!err && edesc->sec4_sg_bytes) { - struct scatterlist *sg = sg_last(req->src, edesc->src_nents); -- print_hex_dump(KERN_ERR, "sglastout@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "sglastout@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, sg_virt(sg), - sg->length + ctx->authsize + 16, 1); - } -@@ -2289,14 +901,17 @@ - edesc = (struct ablkcipher_edesc *)((char *)desc - - offsetof(struct ablkcipher_edesc, hw_desc)); - -- if (err) -- caam_jr_strstatus(jrdev, err); -+ if (err) { -+ char tmp[CAAM_ERROR_STR_MAX]; -+ -+ dev_err(jrdev, "%08x: %s\n", err, caam_jr_strstatus(tmp, err)); -+ } - - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "dstiv @"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "dstiv @"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, req->info, - edesc->src_nents > 1 ? 100 : ivsize, 1); -- print_hex_dump(KERN_ERR, "dst @"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "dst @"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, sg_virt(req->src), - edesc->dst_nents > 1 ? 100 : req->nbytes, 1); - #endif -@@ -2321,14 +936,17 @@ - - edesc = (struct ablkcipher_edesc *)((char *)desc - - offsetof(struct ablkcipher_edesc, hw_desc)); -- if (err) -- caam_jr_strstatus(jrdev, err); -+ if (err) { -+ char tmp[CAAM_ERROR_STR_MAX]; -+ -+ dev_err(jrdev, "%08x: %s\n", err, caam_jr_strstatus(tmp, err)); -+ } - - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "dstiv @"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "dstiv @"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, req->info, - ivsize, 1); -- print_hex_dump(KERN_ERR, "dst @"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "dst @"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, sg_virt(req->src), - edesc->dst_nents > 1 ? 100 : req->nbytes, 1); - #endif -@@ -2355,38 +973,29 @@ - u32 out_options = 0, in_options; - dma_addr_t dst_dma, src_dma; - int len, sec4_sg_index = 0; -- bool is_gcm = false; - - #ifdef DEBUG - debug("assoclen %d cryptlen %d authsize %d\n", - req->assoclen, req->cryptlen, authsize); -- print_hex_dump(KERN_ERR, "assoc @"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "assoc @"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, sg_virt(req->assoc), - req->assoclen , 1); -- print_hex_dump(KERN_ERR, "presciv@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "presciv@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, req->iv, - edesc->src_nents ? 
100 : ivsize, 1); -- print_hex_dump(KERN_ERR, "src @"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "src @"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, sg_virt(req->src), - edesc->src_nents ? 100 : req->cryptlen, 1); -- print_hex_dump(KERN_ERR, "shrdesc@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "shrdesc@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, sh_desc, - desc_bytes(sh_desc), 1); - #endif - -- if (((ctx->class1_alg_type & OP_ALG_ALGSEL_MASK) == -- OP_ALG_ALGSEL_AES) && -- ((ctx->class1_alg_type & OP_ALG_AAI_MASK) == OP_ALG_AAI_GCM)) -- is_gcm = true; -- - len = desc_len(sh_desc); - init_job_desc_shared(desc, ptr, len, HDR_SHARE_DEFER | HDR_REVERSE); - - if (all_contig) { -- if (is_gcm) -- src_dma = edesc->iv_dma; -- else -- src_dma = sg_dma_address(req->assoc); -+ src_dma = sg_dma_address(req->assoc); - in_options = 0; - } else { - src_dma = edesc->sec4_sg_dma; -@@ -2394,9 +1003,12 @@ - (edesc->src_nents ? : 1); - in_options = LDST_SGF; - } -- -- append_seq_in_ptr(desc, src_dma, req->assoclen + ivsize + req->cryptlen, -- in_options); -+ if (encrypt) -+ append_seq_in_ptr(desc, src_dma, req->assoclen + ivsize + -+ req->cryptlen - authsize, in_options); -+ else -+ append_seq_in_ptr(desc, src_dma, req->assoclen + ivsize + -+ req->cryptlen, in_options); - - if (likely(req->src == req->dst)) { - if (all_contig) { -@@ -2417,8 +1029,7 @@ - } - } - if (encrypt) -- append_seq_out_ptr(desc, dst_dma, req->cryptlen + authsize, -- out_options); -+ append_seq_out_ptr(desc, dst_dma, req->cryptlen, out_options); - else - append_seq_out_ptr(desc, dst_dma, req->cryptlen - authsize, - out_options); -@@ -2440,53 +1051,43 @@ - u32 out_options = 0, in_options; - dma_addr_t dst_dma, src_dma; - int len, sec4_sg_index = 0; -- bool is_gcm = false; - - #ifdef DEBUG - debug("assoclen %d cryptlen %d authsize %d\n", - req->assoclen, req->cryptlen, authsize); -- print_hex_dump(KERN_ERR, "assoc @"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "assoc @"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, sg_virt(req->assoc), - req->assoclen , 1); -- print_hex_dump(KERN_ERR, "presciv@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "presciv@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, req->iv, ivsize, 1); -- print_hex_dump(KERN_ERR, "src @"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "src @"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, sg_virt(req->src), - edesc->src_nents > 1 ? 
100 : req->cryptlen, 1); -- print_hex_dump(KERN_ERR, "shrdesc@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "shrdesc@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, sh_desc, - desc_bytes(sh_desc), 1); - #endif - -- if (((ctx->class1_alg_type & OP_ALG_ALGSEL_MASK) == -- OP_ALG_ALGSEL_AES) && -- ((ctx->class1_alg_type & OP_ALG_AAI_MASK) == OP_ALG_AAI_GCM)) -- is_gcm = true; -- - len = desc_len(sh_desc); - init_job_desc_shared(desc, ptr, len, HDR_SHARE_DEFER | HDR_REVERSE); - - if (contig & GIV_SRC_CONTIG) { -- if (is_gcm) -- src_dma = edesc->iv_dma; -- else -- src_dma = sg_dma_address(req->assoc); -+ src_dma = sg_dma_address(req->assoc); - in_options = 0; - } else { - src_dma = edesc->sec4_sg_dma; - sec4_sg_index += edesc->assoc_nents + 1 + edesc->src_nents; - in_options = LDST_SGF; - } -- append_seq_in_ptr(desc, src_dma, req->assoclen + ivsize + req->cryptlen, -- in_options); -+ append_seq_in_ptr(desc, src_dma, req->assoclen + ivsize + -+ req->cryptlen - authsize, in_options); - - if (contig & GIV_DST_CONTIG) { - dst_dma = edesc->iv_dma; - } else { - if (likely(req->src == req->dst)) { - dst_dma = src_dma + sizeof(struct sec4_sg_entry) * -- (edesc->assoc_nents + -- (is_gcm ? 1 + edesc->src_nents : 0)); -+ edesc->assoc_nents; - out_options = LDST_SGF; - } else { - dst_dma = edesc->sec4_sg_dma + -@@ -2496,8 +1097,7 @@ - } - } - -- append_seq_out_ptr(desc, dst_dma, ivsize + req->cryptlen + authsize, -- out_options); -+ append_seq_out_ptr(desc, dst_dma, ivsize + req->cryptlen, out_options); - } - - /* -@@ -2516,10 +1116,10 @@ - int len, sec4_sg_index = 0; - - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "presciv@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "presciv@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, req->info, - ivsize, 1); -- print_hex_dump(KERN_ERR, "src @"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "src @"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, sg_virt(req->src), - edesc->src_nents ? 100 : req->nbytes, 1); - #endif -@@ -2532,7 +1132,7 @@ - in_options = 0; - } else { - src_dma = edesc->sec4_sg_dma; -- sec4_sg_index += edesc->src_nents + 1; -+ sec4_sg_index += (iv_contig ? 0 : 1) + edesc->src_nents; - in_options = LDST_SGF; - } - append_seq_in_ptr(desc, src_dma, req->nbytes + ivsize, in_options); -@@ -2558,59 +1158,10 @@ - } - - /* -- * Fill in ablkcipher givencrypt job descriptor -- */ --static void init_ablkcipher_giv_job(u32 *sh_desc, dma_addr_t ptr, -- struct ablkcipher_edesc *edesc, -- struct ablkcipher_request *req, -- bool iv_contig) --{ -- struct crypto_ablkcipher *ablkcipher = crypto_ablkcipher_reqtfm(req); -- int ivsize = crypto_ablkcipher_ivsize(ablkcipher); -- u32 *desc = edesc->hw_desc; -- u32 out_options, in_options; -- dma_addr_t dst_dma, src_dma; -- int len, sec4_sg_index = 0; -- --#ifdef DEBUG -- print_hex_dump(KERN_ERR, "presciv@" __stringify(__LINE__) ": ", -- DUMP_PREFIX_ADDRESS, 16, 4, req->info, -- ivsize, 1); -- print_hex_dump(KERN_ERR, "src @" __stringify(__LINE__) ": ", -- DUMP_PREFIX_ADDRESS, 16, 4, sg_virt(req->src), -- edesc->src_nents ? 
100 : req->nbytes, 1); --#endif -- -- len = desc_len(sh_desc); -- init_job_desc_shared(desc, ptr, len, HDR_SHARE_DEFER | HDR_REVERSE); -- -- if (!edesc->src_nents) { -- src_dma = sg_dma_address(req->src); -- in_options = 0; -- } else { -- src_dma = edesc->sec4_sg_dma; -- sec4_sg_index += edesc->src_nents; -- in_options = LDST_SGF; -- } -- append_seq_in_ptr(desc, src_dma, req->nbytes, in_options); -- -- if (iv_contig) { -- dst_dma = edesc->iv_dma; -- out_options = 0; -- } else { -- dst_dma = edesc->sec4_sg_dma + -- sec4_sg_index * sizeof(struct sec4_sg_entry); -- out_options = LDST_SGF; -- } -- append_seq_out_ptr(desc, dst_dma, req->nbytes + ivsize, out_options); --} -- --/* - * allocate and map the aead extended descriptor - */ - static struct aead_edesc *aead_edesc_alloc(struct aead_request *req, -- int desc_bytes, bool *all_contig_ptr, -- bool encrypt) -+ int desc_bytes, bool *all_contig_ptr) - { - struct crypto_aead *aead = crypto_aead_reqtfm(req); - struct caam_ctx *ctx = crypto_aead_ctx(aead); -@@ -2625,26 +1176,15 @@ - bool assoc_chained = false, src_chained = false, dst_chained = false; - int ivsize = crypto_aead_ivsize(aead); - int sec4_sg_index, sec4_sg_len = 0, sec4_sg_bytes; -- unsigned int authsize = ctx->authsize; -- bool is_gcm = false; - - assoc_nents = sg_count(req->assoc, req->assoclen, &assoc_chained); -+ src_nents = sg_count(req->src, req->cryptlen, &src_chained); - -- if (unlikely(req->dst != req->src)) { -- src_nents = sg_count(req->src, req->cryptlen, &src_chained); -- dst_nents = sg_count(req->dst, -- req->cryptlen + -- (encrypt ? authsize : (-authsize)), -- &dst_chained); -- } else { -- src_nents = sg_count(req->src, -- req->cryptlen + -- (encrypt ? authsize : 0), -- &src_chained); -- } -+ if (unlikely(req->dst != req->src)) -+ dst_nents = sg_count(req->dst, req->cryptlen, &dst_chained); - - sgc = dma_map_sg_chained(jrdev, req->assoc, assoc_nents ? : 1, -- DMA_TO_DEVICE, assoc_chained); -+ DMA_BIDIRECTIONAL, assoc_chained); - if (likely(req->src == req->dst)) { - sgc = dma_map_sg_chained(jrdev, req->src, src_nents ? : 1, - DMA_BIDIRECTIONAL, src_chained); -@@ -2655,43 +1195,23 @@ - DMA_FROM_DEVICE, dst_chained); - } - -+ /* Check if data are contiguous */ - iv_dma = dma_map_single(jrdev, req->iv, ivsize, DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, iv_dma)) { -- dev_err(jrdev, "unable to map IV\n"); -- return ERR_PTR(-ENOMEM); -- } -- -- if (((ctx->class1_alg_type & OP_ALG_ALGSEL_MASK) == -- OP_ALG_ALGSEL_AES) && -- ((ctx->class1_alg_type & OP_ALG_AAI_MASK) == OP_ALG_AAI_GCM)) -- is_gcm = true; -- -- /* -- * Check if data are contiguous. -- * GCM expected input sequence: IV, AAD, text -- * All other - expected input sequence: AAD, IV, text -- */ -- if (is_gcm) -- all_contig = (!assoc_nents && -- iv_dma + ivsize == sg_dma_address(req->assoc) && -- !src_nents && sg_dma_address(req->assoc) + -- req->assoclen == sg_dma_address(req->src)); -- else -- all_contig = (!assoc_nents && sg_dma_address(req->assoc) + -- req->assoclen == iv_dma && !src_nents && -- iv_dma + ivsize == sg_dma_address(req->src)); -- if (!all_contig) { -+ if (assoc_nents || sg_dma_address(req->assoc) + req->assoclen != -+ iv_dma || src_nents || iv_dma + ivsize != -+ sg_dma_address(req->src)) { -+ all_contig = false; - assoc_nents = assoc_nents ? : 1; - src_nents = src_nents ? 
: 1; - sec4_sg_len = assoc_nents + 1 + src_nents; - } -- - sec4_sg_len += dst_nents; - - sec4_sg_bytes = sec4_sg_len * sizeof(struct sec4_sg_entry); -+ dma_sync_single_for_device(jrdev, iv_dma, ivsize, DMA_TO_DEVICE); - - /* allocate space for base edesc and hw desc commands, link tables */ -- edesc = kmalloc(sizeof(struct aead_edesc) + desc_bytes + -+ edesc = kzalloc(sizeof(struct aead_edesc) + desc_bytes + - sec4_sg_bytes, GFP_DMA | flags); - if (!edesc) { - dev_err(jrdev, "could not allocate extended descriptor\n"); -@@ -2708,46 +1228,32 @@ - edesc->sec4_sg_bytes = sec4_sg_bytes; - edesc->sec4_sg = (void *)edesc + sizeof(struct aead_edesc) + - desc_bytes; -+ edesc->sec4_sg_dma = dma_map_single(jrdev, edesc->sec4_sg, -+ sec4_sg_bytes, DMA_TO_DEVICE); - *all_contig_ptr = all_contig; - - sec4_sg_index = 0; - if (!all_contig) { -- if (!is_gcm) { -- sg_to_sec4_sg(req->assoc, -- assoc_nents, -- edesc->sec4_sg + -- sec4_sg_index, 0); -- sec4_sg_index += assoc_nents; -- } -- -+ sg_to_sec4_sg(req->assoc, -+ (assoc_nents ? : 1), -+ edesc->sec4_sg + -+ sec4_sg_index, 0); -+ sec4_sg_index += assoc_nents ? : 1; - dma_to_sec4_sg_one(edesc->sec4_sg + sec4_sg_index, - iv_dma, ivsize, 0); - sec4_sg_index += 1; -- -- if (is_gcm) { -- sg_to_sec4_sg(req->assoc, -- assoc_nents, -- edesc->sec4_sg + -- sec4_sg_index, 0); -- sec4_sg_index += assoc_nents; -- } -- - sg_to_sec4_sg_last(req->src, -- src_nents, -+ (src_nents ? : 1), - edesc->sec4_sg + - sec4_sg_index, 0); -- sec4_sg_index += src_nents; -+ sec4_sg_index += src_nents ? : 1; - } - if (dst_nents) { - sg_to_sec4_sg_last(req->dst, dst_nents, - edesc->sec4_sg + sec4_sg_index, 0); - } -- edesc->sec4_sg_dma = dma_map_single(jrdev, edesc->sec4_sg, -- sec4_sg_bytes, DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, edesc->sec4_sg_dma)) { -- dev_err(jrdev, "unable to map S/G table\n"); -- return ERR_PTR(-ENOMEM); -- } -+ dma_sync_single_for_device(jrdev, edesc->sec4_sg_dma, sec4_sg_bytes, -+ DMA_TO_DEVICE); - - return edesc; - } -@@ -2762,9 +1268,11 @@ - u32 *desc; - int ret = 0; - -+ req->cryptlen += ctx->authsize; -+ - /* allocate extended descriptor */ - edesc = aead_edesc_alloc(req, DESC_JOB_IO_LEN * -- CAAM_CMD_SZ, &all_contig, true); -+ CAAM_CMD_SZ, &all_contig); - if (IS_ERR(edesc)) - return PTR_ERR(edesc); - -@@ -2772,7 +1280,7 @@ - init_aead_job(ctx->sh_desc_enc, ctx->sh_desc_enc_dma, edesc, req, - all_contig, true); - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "aead jobdesc@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "aead jobdesc@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, edesc->hw_desc, - desc_bytes(edesc->hw_desc), 1); - #endif -@@ -2801,12 +1309,12 @@ - - /* allocate extended descriptor */ - edesc = aead_edesc_alloc(req, DESC_JOB_IO_LEN * -- CAAM_CMD_SZ, &all_contig, false); -+ CAAM_CMD_SZ, &all_contig); - if (IS_ERR(edesc)) - return PTR_ERR(edesc); - - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "dec src@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "dec src@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, sg_virt(req->src), - req->cryptlen, 1); - #endif -@@ -2815,7 +1323,7 @@ - init_aead_job(ctx->sh_desc_dec, - ctx->sh_desc_dec_dma, edesc, req, all_contig, false); - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "aead jobdesc@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "aead jobdesc@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, edesc->hw_desc, - desc_bytes(edesc->hw_desc), 1); - #endif -@@ -2853,17 +1361,15 @@ - int ivsize = crypto_aead_ivsize(aead); - bool assoc_chained = false, src_chained = false, 
dst_chained = false; - int sec4_sg_index, sec4_sg_len = 0, sec4_sg_bytes; -- bool is_gcm = false; - - assoc_nents = sg_count(req->assoc, req->assoclen, &assoc_chained); - src_nents = sg_count(req->src, req->cryptlen, &src_chained); - - if (unlikely(req->dst != req->src)) -- dst_nents = sg_count(req->dst, req->cryptlen + ctx->authsize, -- &dst_chained); -+ dst_nents = sg_count(req->dst, req->cryptlen, &dst_chained); - - sgc = dma_map_sg_chained(jrdev, req->assoc, assoc_nents ? : 1, -- DMA_TO_DEVICE, assoc_chained); -+ DMA_BIDIRECTIONAL, assoc_chained); - if (likely(req->src == req->dst)) { - sgc = dma_map_sg_chained(jrdev, req->src, src_nents ? : 1, - DMA_BIDIRECTIONAL, src_chained); -@@ -2874,64 +1380,32 @@ - DMA_FROM_DEVICE, dst_chained); - } - -+ /* Check if data are contiguous */ - iv_dma = dma_map_single(jrdev, greq->giv, ivsize, DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, iv_dma)) { -- dev_err(jrdev, "unable to map IV\n"); -- return ERR_PTR(-ENOMEM); -- } -- -- if (((ctx->class1_alg_type & OP_ALG_ALGSEL_MASK) == -- OP_ALG_ALGSEL_AES) && -- ((ctx->class1_alg_type & OP_ALG_AAI_MASK) == OP_ALG_AAI_GCM)) -- is_gcm = true; -- -- /* -- * Check if data are contiguous. -- * GCM expected input sequence: IV, AAD, text -- * All other - expected input sequence: AAD, IV, text -- */ -- -- if (is_gcm) { -- if (assoc_nents || iv_dma + ivsize != -- sg_dma_address(req->assoc) || src_nents || -- sg_dma_address(req->assoc) + req->assoclen != -- sg_dma_address(req->src)) -- contig &= ~GIV_SRC_CONTIG; -- } else { -- if (assoc_nents || -- sg_dma_address(req->assoc) + req->assoclen != iv_dma || -- src_nents || iv_dma + ivsize != sg_dma_address(req->src)) -- contig &= ~GIV_SRC_CONTIG; -- } -- -+ if (assoc_nents || sg_dma_address(req->assoc) + req->assoclen != -+ iv_dma || src_nents || iv_dma + ivsize != sg_dma_address(req->src)) -+ contig &= ~GIV_SRC_CONTIG; - if (dst_nents || iv_dma + ivsize != sg_dma_address(req->dst)) - contig &= ~GIV_DST_CONTIG; -- -+ if (unlikely(req->src != req->dst)) { -+ dst_nents = dst_nents ? : 1; -+ sec4_sg_len += 1; -+ } - if (!(contig & GIV_SRC_CONTIG)) { - assoc_nents = assoc_nents ? : 1; - src_nents = src_nents ? : 1; - sec4_sg_len += assoc_nents + 1 + src_nents; -- if (req->src == req->dst && -- (src_nents || iv_dma + ivsize != sg_dma_address(req->src))) -- contig &= ~GIV_DST_CONTIG; -- } -- -- /* -- * Add new sg entries for GCM output sequence. -- * Expected output sequence: IV, encrypted text. -- */ -- if (is_gcm && req->src == req->dst && !(contig & GIV_DST_CONTIG)) -- sec4_sg_len += 1 + src_nents; -- -- if (unlikely(req->src != req->dst)) { -- dst_nents = dst_nents ? 
: 1; -- sec4_sg_len += 1 + dst_nents; -+ if (likely(req->src == req->dst)) -+ contig &= ~GIV_DST_CONTIG; - } -+ sec4_sg_len += dst_nents; - - sec4_sg_bytes = sec4_sg_len * sizeof(struct sec4_sg_entry); - -+ dma_sync_single_for_device(jrdev, iv_dma, ivsize, DMA_TO_DEVICE); -+ - /* allocate space for base edesc and hw desc commands, link tables */ -- edesc = kmalloc(sizeof(struct aead_edesc) + desc_bytes + -+ edesc = kzalloc(sizeof(struct aead_edesc) + desc_bytes + - sec4_sg_bytes, GFP_DMA | flags); - if (!edesc) { - dev_err(jrdev, "could not allocate extended descriptor\n"); -@@ -2948,40 +1422,24 @@ - edesc->sec4_sg_bytes = sec4_sg_bytes; - edesc->sec4_sg = (void *)edesc + sizeof(struct aead_edesc) + - desc_bytes; -+ edesc->sec4_sg_dma = dma_map_single(jrdev, edesc->sec4_sg, -+ sec4_sg_bytes, DMA_TO_DEVICE); - *contig_ptr = contig; - - sec4_sg_index = 0; - if (!(contig & GIV_SRC_CONTIG)) { -- if (!is_gcm) { -- sg_to_sec4_sg(req->assoc, assoc_nents, -- edesc->sec4_sg + sec4_sg_index, 0); -- sec4_sg_index += assoc_nents; -- } -- -+ sg_to_sec4_sg(req->assoc, assoc_nents, -+ edesc->sec4_sg + -+ sec4_sg_index, 0); -+ sec4_sg_index += assoc_nents; - dma_to_sec4_sg_one(edesc->sec4_sg + sec4_sg_index, - iv_dma, ivsize, 0); - sec4_sg_index += 1; -- -- if (is_gcm) { -- sg_to_sec4_sg(req->assoc, assoc_nents, -- edesc->sec4_sg + sec4_sg_index, 0); -- sec4_sg_index += assoc_nents; -- } -- - sg_to_sec4_sg_last(req->src, src_nents, - edesc->sec4_sg + - sec4_sg_index, 0); - sec4_sg_index += src_nents; - } -- -- if (is_gcm && req->src == req->dst && !(contig & GIV_DST_CONTIG)) { -- dma_to_sec4_sg_one(edesc->sec4_sg + sec4_sg_index, -- iv_dma, ivsize, 0); -- sec4_sg_index += 1; -- sg_to_sec4_sg_last(req->src, src_nents, -- edesc->sec4_sg + sec4_sg_index, 0); -- } -- - if (unlikely(req->src != req->dst && !(contig & GIV_DST_CONTIG))) { - dma_to_sec4_sg_one(edesc->sec4_sg + sec4_sg_index, - iv_dma, ivsize, 0); -@@ -2989,12 +1447,8 @@ - sg_to_sec4_sg_last(req->dst, dst_nents, - edesc->sec4_sg + sec4_sg_index, 0); - } -- edesc->sec4_sg_dma = dma_map_single(jrdev, edesc->sec4_sg, -- sec4_sg_bytes, DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, edesc->sec4_sg_dma)) { -- dev_err(jrdev, "unable to map S/G table\n"); -- return ERR_PTR(-ENOMEM); -- } -+ dma_sync_single_for_device(jrdev, edesc->sec4_sg_dma, sec4_sg_bytes, -+ DMA_TO_DEVICE); - - return edesc; - } -@@ -3010,6 +1464,8 @@ - u32 *desc; - int ret = 0; - -+ req->cryptlen += ctx->authsize; -+ - /* allocate extended descriptor */ - edesc = aead_giv_edesc_alloc(areq, DESC_JOB_IO_LEN * - CAAM_CMD_SZ, &contig); -@@ -3018,7 +1474,7 @@ - return PTR_ERR(edesc); - - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "giv src@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "giv src@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, sg_virt(req->src), - req->cryptlen, 1); - #endif -@@ -3027,7 +1483,7 @@ - init_aead_giv_job(ctx->sh_desc_givenc, - ctx->sh_desc_givenc_dma, edesc, req, contig); - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "aead jobdesc@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "aead jobdesc@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, edesc->hw_desc, - desc_bytes(edesc->hw_desc), 1); - #endif -@@ -3044,11 +1500,6 @@ - return ret; - } - --static int aead_null_givencrypt(struct aead_givcrypt_request *areq) --{ -- return aead_encrypt(&areq->areq); --} -- - /* - * allocate and map the ablkcipher extended descriptor for ablkcipher - */ -@@ -3086,16 +1537,12 @@ - DMA_FROM_DEVICE, dst_chained); - } - -- iv_dma = dma_map_single(jrdev, req->info, 
ivsize, DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, iv_dma)) { -- dev_err(jrdev, "unable to map IV\n"); -- return ERR_PTR(-ENOMEM); -- } -- - /* - * Check if iv can be contiguous with source and destination. - * If so, include it. If not, create scatterlist. - */ -+ iv_dma = dma_map_single(jrdev, req->info, ivsize, DMA_TO_DEVICE); -+ dma_sync_single_for_device(jrdev, iv_dma, ivsize, DMA_TO_DEVICE); - if (!src_nents && iv_dma + ivsize == sg_dma_address(req->src)) - iv_contig = true; - else -@@ -3104,7 +1551,7 @@ - sizeof(struct sec4_sg_entry); - - /* allocate space for base edesc and hw desc commands, link tables */ -- edesc = kmalloc(sizeof(struct ablkcipher_edesc) + desc_bytes + -+ edesc = kzalloc(sizeof(struct ablkcipher_edesc) + desc_bytes + - sec4_sg_bytes, GFP_DMA | flags); - if (!edesc) { - dev_err(jrdev, "could not allocate extended descriptor\n"); -@@ -3134,15 +1581,13 @@ - - edesc->sec4_sg_dma = dma_map_single(jrdev, edesc->sec4_sg, - sec4_sg_bytes, DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, edesc->sec4_sg_dma)) { -- dev_err(jrdev, "unable to map S/G table\n"); -- return ERR_PTR(-ENOMEM); -- } -- - edesc->iv_dma = iv_dma; - -+ dma_sync_single_for_device(jrdev, edesc->sec4_sg_dma, sec4_sg_bytes, -+ DMA_TO_DEVICE); -+ - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "ablkcipher sec4_sg@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "ablkcipher sec4_sg@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, edesc->sec4_sg, - sec4_sg_bytes, 1); - #endif -@@ -3171,7 +1616,7 @@ - init_ablkcipher_job(ctx->sh_desc_enc, - ctx->sh_desc_enc_dma, edesc, req, iv_contig); - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "ablkcipher jobdesc@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "ablkcipher jobdesc@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, edesc->hw_desc, - desc_bytes(edesc->hw_desc), 1); - #endif -@@ -3209,7 +1654,7 @@ - ctx->sh_desc_dec_dma, edesc, req, iv_contig); - desc = edesc->hw_desc; - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "ablkcipher jobdesc@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "ablkcipher jobdesc@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, edesc->hw_desc, - desc_bytes(edesc->hw_desc), 1); - #endif -@@ -3225,291 +1670,28 @@ - return ret; - } - --/* -- * allocate and map the ablkcipher extended descriptor -- * for ablkcipher givencrypt -- */ --static struct ablkcipher_edesc *ablkcipher_giv_edesc_alloc( -- struct skcipher_givcrypt_request *greq, -- int desc_bytes, -- bool *iv_contig_out) --{ -- struct ablkcipher_request *req = &greq->creq; -- struct crypto_ablkcipher *ablkcipher = crypto_ablkcipher_reqtfm(req); -- struct caam_ctx *ctx = crypto_ablkcipher_ctx(ablkcipher); -- struct device *jrdev = ctx->jrdev; -- gfp_t flags = (req->base.flags & (CRYPTO_TFM_REQ_MAY_BACKLOG | -- CRYPTO_TFM_REQ_MAY_SLEEP)) ? -- GFP_KERNEL : GFP_ATOMIC; -- int src_nents, dst_nents = 0, sec4_sg_bytes; -- struct ablkcipher_edesc *edesc; -- dma_addr_t iv_dma = 0; -- bool iv_contig = false; -- int sgc; -- int ivsize = crypto_ablkcipher_ivsize(ablkcipher); -- bool src_chained = false, dst_chained = false; -- int sec4_sg_index; -- -- src_nents = sg_count(req->src, req->nbytes, &src_chained); -- -- if (unlikely(req->dst != req->src)) -- dst_nents = sg_count(req->dst, req->nbytes, &dst_chained); -- -- if (likely(req->src == req->dst)) { -- sgc = dma_map_sg_chained(jrdev, req->src, src_nents ? : 1, -- DMA_BIDIRECTIONAL, src_chained); -- } else { -- sgc = dma_map_sg_chained(jrdev, req->src, src_nents ? 
: 1, -- DMA_TO_DEVICE, src_chained); -- sgc = dma_map_sg_chained(jrdev, req->dst, dst_nents ? : 1, -- DMA_FROM_DEVICE, dst_chained); -- } -- -- /* -- * Check if iv can be contiguous with source and destination. -- * If so, include it. If not, create scatterlist. -- */ -- iv_dma = dma_map_single(jrdev, greq->giv, ivsize, DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, iv_dma)) { -- dev_err(jrdev, "unable to map IV\n"); -- return ERR_PTR(-ENOMEM); -- } -- -- if (!dst_nents && iv_dma + ivsize == sg_dma_address(req->dst)) -- iv_contig = true; -- else -- dst_nents = dst_nents ? : 1; -- sec4_sg_bytes = ((iv_contig ? 0 : 1) + src_nents + dst_nents) * -- sizeof(struct sec4_sg_entry); -- -- /* allocate space for base edesc and hw desc commands, link tables */ -- edesc = kmalloc(sizeof(*edesc) + desc_bytes + -- sec4_sg_bytes, GFP_DMA | flags); -- if (!edesc) { -- dev_err(jrdev, "could not allocate extended descriptor\n"); -- return ERR_PTR(-ENOMEM); -- } -- -- edesc->src_nents = src_nents; -- edesc->src_chained = src_chained; -- edesc->dst_nents = dst_nents; -- edesc->dst_chained = dst_chained; -- edesc->sec4_sg_bytes = sec4_sg_bytes; -- edesc->sec4_sg = (void *)edesc + sizeof(struct ablkcipher_edesc) + -- desc_bytes; -- -- sec4_sg_index = 0; -- if (src_nents) { -- sg_to_sec4_sg_last(req->src, src_nents, edesc->sec4_sg, 0); -- sec4_sg_index += src_nents; -- } -- -- if (!iv_contig) { -- dma_to_sec4_sg_one(edesc->sec4_sg + sec4_sg_index, -- iv_dma, ivsize, 0); -- sec4_sg_index += 1; -- sg_to_sec4_sg_last(req->dst, dst_nents, -- edesc->sec4_sg + sec4_sg_index, 0); -- } -- -- edesc->sec4_sg_dma = dma_map_single(jrdev, edesc->sec4_sg, -- sec4_sg_bytes, DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, edesc->sec4_sg_dma)) { -- dev_err(jrdev, "unable to map S/G table\n"); -- return ERR_PTR(-ENOMEM); -- } -- edesc->iv_dma = iv_dma; -- --#ifdef DEBUG -- print_hex_dump(KERN_ERR, -- "ablkcipher sec4_sg@" __stringify(__LINE__) ": ", -- DUMP_PREFIX_ADDRESS, 16, 4, edesc->sec4_sg, -- sec4_sg_bytes, 1); --#endif -- -- *iv_contig_out = iv_contig; -- return edesc; --} -- --static int ablkcipher_givencrypt(struct skcipher_givcrypt_request *creq) --{ -- struct ablkcipher_request *req = &creq->creq; -- struct ablkcipher_edesc *edesc; -- struct crypto_ablkcipher *ablkcipher = crypto_ablkcipher_reqtfm(req); -- struct caam_ctx *ctx = crypto_ablkcipher_ctx(ablkcipher); -- struct device *jrdev = ctx->jrdev; -- bool iv_contig; -- u32 *desc; -- int ret = 0; -- -- /* allocate extended descriptor */ -- edesc = ablkcipher_giv_edesc_alloc(creq, DESC_JOB_IO_LEN * -- CAAM_CMD_SZ, &iv_contig); -- if (IS_ERR(edesc)) -- return PTR_ERR(edesc); -- -- /* Create and submit job descriptor*/ -- init_ablkcipher_giv_job(ctx->sh_desc_givenc, ctx->sh_desc_givenc_dma, -- edesc, req, iv_contig); --#ifdef DEBUG -- print_hex_dump(KERN_ERR, -- "ablkcipher jobdesc@" __stringify(__LINE__) ": ", -- DUMP_PREFIX_ADDRESS, 16, 4, edesc->hw_desc, -- desc_bytes(edesc->hw_desc), 1); --#endif -- desc = edesc->hw_desc; -- ret = caam_jr_enqueue(jrdev, desc, ablkcipher_encrypt_done, req); -- -- if (!ret) { -- ret = -EINPROGRESS; -- } else { -- ablkcipher_unmap(jrdev, edesc, req); -- kfree(edesc); -- } -- -- return ret; --} -- - #define template_aead template_u.aead - #define template_ablkcipher template_u.ablkcipher - struct caam_alg_template { - char name[CRYPTO_MAX_ALG_NAME]; -- char driver_name[CRYPTO_MAX_ALG_NAME]; -- unsigned int blocksize; -- u32 type; -- union { -- struct ablkcipher_alg ablkcipher; -- struct aead_alg aead; -- struct blkcipher_alg blkcipher; 
-- struct cipher_alg cipher; -- struct compress_alg compress; -- struct rng_alg rng; -- } template_u; -- u32 class1_alg_type; -- u32 class2_alg_type; -- u32 alg_op; --}; -- --static struct caam_alg_template driver_algs[] = { -- /* single-pass ipsec_esp descriptor */ -- { -- .name = "authenc(hmac(md5),ecb(cipher_null))", -- .driver_name = "authenc-hmac-md5-ecb-cipher_null-caam", -- .blocksize = NULL_BLOCK_SIZE, -- .type = CRYPTO_ALG_TYPE_AEAD, -- .template_aead = { -- .setkey = aead_setkey, -- .setauthsize = aead_setauthsize, -- .encrypt = aead_encrypt, -- .decrypt = aead_decrypt, -- .givencrypt = aead_null_givencrypt, -- .geniv = "", -- .ivsize = NULL_IV_SIZE, -- .maxauthsize = MD5_DIGEST_SIZE, -- }, -- .class1_alg_type = 0, -- .class2_alg_type = OP_ALG_ALGSEL_MD5 | OP_ALG_AAI_HMAC_PRECOMP, -- .alg_op = OP_ALG_ALGSEL_MD5 | OP_ALG_AAI_HMAC, -- }, -- { -- .name = "authenc(hmac(sha1),ecb(cipher_null))", -- .driver_name = "authenc-hmac-sha1-ecb-cipher_null-caam", -- .blocksize = NULL_BLOCK_SIZE, -- .type = CRYPTO_ALG_TYPE_AEAD, -- .template_aead = { -- .setkey = aead_setkey, -- .setauthsize = aead_setauthsize, -- .encrypt = aead_encrypt, -- .decrypt = aead_decrypt, -- .givencrypt = aead_null_givencrypt, -- .geniv = "", -- .ivsize = NULL_IV_SIZE, -- .maxauthsize = SHA1_DIGEST_SIZE, -- }, -- .class1_alg_type = 0, -- .class2_alg_type = OP_ALG_ALGSEL_SHA1 | OP_ALG_AAI_HMAC_PRECOMP, -- .alg_op = OP_ALG_ALGSEL_SHA1 | OP_ALG_AAI_HMAC, -- }, -- { -- .name = "authenc(hmac(sha224),ecb(cipher_null))", -- .driver_name = "authenc-hmac-sha224-ecb-cipher_null-caam", -- .blocksize = NULL_BLOCK_SIZE, -- .type = CRYPTO_ALG_TYPE_AEAD, -- .template_aead = { -- .setkey = aead_setkey, -- .setauthsize = aead_setauthsize, -- .encrypt = aead_encrypt, -- .decrypt = aead_decrypt, -- .givencrypt = aead_null_givencrypt, -- .geniv = "", -- .ivsize = NULL_IV_SIZE, -- .maxauthsize = SHA224_DIGEST_SIZE, -- }, -- .class1_alg_type = 0, -- .class2_alg_type = OP_ALG_ALGSEL_SHA224 | -- OP_ALG_AAI_HMAC_PRECOMP, -- .alg_op = OP_ALG_ALGSEL_SHA224 | OP_ALG_AAI_HMAC, -- }, -- { -- .name = "authenc(hmac(sha256),ecb(cipher_null))", -- .driver_name = "authenc-hmac-sha256-ecb-cipher_null-caam", -- .blocksize = NULL_BLOCK_SIZE, -- .type = CRYPTO_ALG_TYPE_AEAD, -- .template_aead = { -- .setkey = aead_setkey, -- .setauthsize = aead_setauthsize, -- .encrypt = aead_encrypt, -- .decrypt = aead_decrypt, -- .givencrypt = aead_null_givencrypt, -- .geniv = "", -- .ivsize = NULL_IV_SIZE, -- .maxauthsize = SHA256_DIGEST_SIZE, -- }, -- .class1_alg_type = 0, -- .class2_alg_type = OP_ALG_ALGSEL_SHA256 | -- OP_ALG_AAI_HMAC_PRECOMP, -- .alg_op = OP_ALG_ALGSEL_SHA256 | OP_ALG_AAI_HMAC, -- }, -- { -- .name = "authenc(hmac(sha384),ecb(cipher_null))", -- .driver_name = "authenc-hmac-sha384-ecb-cipher_null-caam", -- .blocksize = NULL_BLOCK_SIZE, -- .type = CRYPTO_ALG_TYPE_AEAD, -- .template_aead = { -- .setkey = aead_setkey, -- .setauthsize = aead_setauthsize, -- .encrypt = aead_encrypt, -- .decrypt = aead_decrypt, -- .givencrypt = aead_null_givencrypt, -- .geniv = "", -- .ivsize = NULL_IV_SIZE, -- .maxauthsize = SHA384_DIGEST_SIZE, -- }, -- .class1_alg_type = 0, -- .class2_alg_type = OP_ALG_ALGSEL_SHA384 | -- OP_ALG_AAI_HMAC_PRECOMP, -- .alg_op = OP_ALG_ALGSEL_SHA384 | OP_ALG_AAI_HMAC, -- }, -- { -- .name = "authenc(hmac(sha512),ecb(cipher_null))", -- .driver_name = "authenc-hmac-sha512-ecb-cipher_null-caam", -- .blocksize = NULL_BLOCK_SIZE, -- .type = CRYPTO_ALG_TYPE_AEAD, -- .template_aead = { -- .setkey = aead_setkey, -- .setauthsize = aead_setauthsize, -- 
.encrypt = aead_encrypt, -- .decrypt = aead_decrypt, -- .givencrypt = aead_null_givencrypt, -- .geniv = "", -- .ivsize = NULL_IV_SIZE, -- .maxauthsize = SHA512_DIGEST_SIZE, -- }, -- .class1_alg_type = 0, -- .class2_alg_type = OP_ALG_ALGSEL_SHA512 | -- OP_ALG_AAI_HMAC_PRECOMP, -- .alg_op = OP_ALG_ALGSEL_SHA512 | OP_ALG_AAI_HMAC, -- }, -+ char driver_name[CRYPTO_MAX_ALG_NAME]; -+ unsigned int blocksize; -+ u32 type; -+ union { -+ struct ablkcipher_alg ablkcipher; -+ struct aead_alg aead; -+ struct blkcipher_alg blkcipher; -+ struct cipher_alg cipher; -+ struct compress_alg compress; -+ struct rng_alg rng; -+ } template_u; -+ u32 class1_alg_type; -+ u32 class2_alg_type; -+ u32 alg_op; -+}; -+ -+static struct caam_alg_template driver_algs[] = { -+ /* single-pass ipsec_esp descriptor */ - { - .name = "authenc(hmac(md5),cbc(aes))", - .driver_name = "authenc-hmac-md5-cbc-aes-caam", -@@ -3865,188 +2047,81 @@ - OP_ALG_AAI_HMAC_PRECOMP, - .alg_op = OP_ALG_ALGSEL_SHA512 | OP_ALG_AAI_HMAC, - }, -+ /* ablkcipher descriptor */ - { -- .name = "authenc(hmac(md5),rfc3686(ctr(aes)))", -- .driver_name = "authenc-hmac-md5-rfc3686-ctr-aes-caam", -- .blocksize = 1, -- .type = CRYPTO_ALG_TYPE_AEAD, -- .template_aead = { -- .setkey = aead_setkey, -- .setauthsize = aead_setauthsize, -- .encrypt = aead_encrypt, -- .decrypt = aead_decrypt, -- .givencrypt = aead_givencrypt, -- .geniv = "", -- .ivsize = CTR_RFC3686_IV_SIZE, -- .maxauthsize = MD5_DIGEST_SIZE, -- }, -- .class1_alg_type = OP_ALG_ALGSEL_AES | OP_ALG_AAI_CTR_MOD128, -- .class2_alg_type = OP_ALG_ALGSEL_MD5 | OP_ALG_AAI_HMAC_PRECOMP, -- .alg_op = OP_ALG_ALGSEL_MD5 | OP_ALG_AAI_HMAC, -- }, -- { -- .name = "authenc(hmac(sha1),rfc3686(ctr(aes)))", -- .driver_name = "authenc-hmac-sha1-rfc3686-ctr-aes-caam", -- .blocksize = 1, -- .type = CRYPTO_ALG_TYPE_AEAD, -- .template_aead = { -- .setkey = aead_setkey, -- .setauthsize = aead_setauthsize, -- .encrypt = aead_encrypt, -- .decrypt = aead_decrypt, -- .givencrypt = aead_givencrypt, -- .geniv = "", -- .ivsize = CTR_RFC3686_IV_SIZE, -- .maxauthsize = SHA1_DIGEST_SIZE, -- }, -- .class1_alg_type = OP_ALG_ALGSEL_AES | OP_ALG_AAI_CTR_MOD128, -- .class2_alg_type = OP_ALG_ALGSEL_SHA1 | OP_ALG_AAI_HMAC_PRECOMP, -- .alg_op = OP_ALG_ALGSEL_SHA1 | OP_ALG_AAI_HMAC, -- }, -- { -- .name = "authenc(hmac(sha224),rfc3686(ctr(aes)))", -- .driver_name = "authenc-hmac-sha224-rfc3686-ctr-aes-caam", -- .blocksize = 1, -- .type = CRYPTO_ALG_TYPE_AEAD, -- .template_aead = { -- .setkey = aead_setkey, -- .setauthsize = aead_setauthsize, -- .encrypt = aead_encrypt, -- .decrypt = aead_decrypt, -- .givencrypt = aead_givencrypt, -- .geniv = "", -- .ivsize = CTR_RFC3686_IV_SIZE, -- .maxauthsize = SHA224_DIGEST_SIZE, -+ .name = "ecb(des)", -+ .driver_name = "ecb-des-caam", -+ .blocksize = DES_BLOCK_SIZE, -+ .type = CRYPTO_ALG_TYPE_ABLKCIPHER, -+ .template_ablkcipher = { -+ .setkey = ablkcipher_setkey, -+ .encrypt = ablkcipher_encrypt, -+ .decrypt = ablkcipher_decrypt, -+ .geniv = "eseqiv", -+ .min_keysize = DES_KEY_SIZE, -+ .max_keysize = DES_KEY_SIZE, -+ .ivsize = DES_BLOCK_SIZE, - }, -- .class1_alg_type = OP_ALG_ALGSEL_AES | OP_ALG_AAI_CTR_MOD128, -- .class2_alg_type = OP_ALG_ALGSEL_SHA224 | -- OP_ALG_AAI_HMAC_PRECOMP, -- .alg_op = OP_ALG_ALGSEL_SHA224 | OP_ALG_AAI_HMAC, -+ .class1_alg_type = OP_ALG_ALGSEL_DES | OP_ALG_AAI_ECB, - }, - { -- .name = "authenc(hmac(sha256),rfc3686(ctr(aes)))", -- .driver_name = "authenc-hmac-sha256-rfc3686-ctr-aes-caam", -- .blocksize = 1, -- .type = CRYPTO_ALG_TYPE_AEAD, -- .template_aead = { -- .setkey = 
aead_setkey, -- .setauthsize = aead_setauthsize, -- .encrypt = aead_encrypt, -- .decrypt = aead_decrypt, -- .givencrypt = aead_givencrypt, -- .geniv = "", -- .ivsize = CTR_RFC3686_IV_SIZE, -- .maxauthsize = SHA256_DIGEST_SIZE, -- }, -- .class1_alg_type = OP_ALG_ALGSEL_AES | OP_ALG_AAI_CTR_MOD128, -- .class2_alg_type = OP_ALG_ALGSEL_SHA256 | -- OP_ALG_AAI_HMAC_PRECOMP, -- .alg_op = OP_ALG_ALGSEL_SHA256 | OP_ALG_AAI_HMAC, -+ .name = "ecb(arc4)", -+ .driver_name = "ecb-arc4-caam", -+ .blocksize = ARC4_BLOCK_SIZE, -+ .type = CRYPTO_ALG_TYPE_ABLKCIPHER, -+ .template_ablkcipher = { -+ .setkey = ablkcipher_setkey, -+ .encrypt = ablkcipher_encrypt, -+ .decrypt = ablkcipher_decrypt, -+ .geniv = "eseqiv", -+ .min_keysize = ARC4_MIN_KEY_SIZE, -+ .max_keysize = ARC4_MAX_KEY_SIZE, -+ .ivsize = ARC4_BLOCK_SIZE, -+ }, -+ .class1_alg_type = OP_ALG_ALGSEL_ARC4 | OP_ALG_AAI_ECB - }, - { -- .name = "authenc(hmac(sha384),rfc3686(ctr(aes)))", -- .driver_name = "authenc-hmac-sha384-rfc3686-ctr-aes-caam", -- .blocksize = 1, -- .type = CRYPTO_ALG_TYPE_AEAD, -- .template_aead = { -- .setkey = aead_setkey, -- .setauthsize = aead_setauthsize, -- .encrypt = aead_encrypt, -- .decrypt = aead_decrypt, -- .givencrypt = aead_givencrypt, -- .geniv = "", -- .ivsize = CTR_RFC3686_IV_SIZE, -- .maxauthsize = SHA384_DIGEST_SIZE, -+ .name = "ecb(aes)", -+ .driver_name = "ecb-aes-caam", -+ .blocksize = AES_BLOCK_SIZE, -+ .type = CRYPTO_ALG_TYPE_ABLKCIPHER, -+ .template_ablkcipher = { -+ .setkey = ablkcipher_setkey, -+ .encrypt = ablkcipher_encrypt, -+ .decrypt = ablkcipher_decrypt, -+ .geniv = "eseqiv", -+ .min_keysize = AES_MIN_KEY_SIZE, -+ .max_keysize = AES_MAX_KEY_SIZE, -+ .ivsize = AES_BLOCK_SIZE, - }, -- .class1_alg_type = OP_ALG_ALGSEL_AES | OP_ALG_AAI_CTR_MOD128, -- .class2_alg_type = OP_ALG_ALGSEL_SHA384 | -- OP_ALG_AAI_HMAC_PRECOMP, -- .alg_op = OP_ALG_ALGSEL_SHA384 | OP_ALG_AAI_HMAC, -+ .class1_alg_type = OP_ALG_ALGSEL_AES | OP_ALG_AAI_ECB, - }, - { -- .name = "authenc(hmac(sha512),rfc3686(ctr(aes)))", -- .driver_name = "authenc-hmac-sha512-rfc3686-ctr-aes-caam", -- .blocksize = 1, -- .type = CRYPTO_ALG_TYPE_AEAD, -- .template_aead = { -- .setkey = aead_setkey, -- .setauthsize = aead_setauthsize, -- .encrypt = aead_encrypt, -- .decrypt = aead_decrypt, -- .givencrypt = aead_givencrypt, -- .geniv = "", -- .ivsize = CTR_RFC3686_IV_SIZE, -- .maxauthsize = SHA512_DIGEST_SIZE, -+ .name = "ctr(aes)", -+ .driver_name = "ctr-aes-caam", -+ .blocksize = AES_BLOCK_SIZE, -+ .type = CRYPTO_ALG_TYPE_ABLKCIPHER, -+ .template_ablkcipher = { -+ .setkey = ablkcipher_setkey, -+ .encrypt = ablkcipher_encrypt, -+ .decrypt = ablkcipher_decrypt, -+ .geniv = "eseqiv", -+ .min_keysize = AES_MIN_KEY_SIZE, -+ .max_keysize = AES_MAX_KEY_SIZE, -+ .ivsize = AES_BLOCK_SIZE, - }, - .class1_alg_type = OP_ALG_ALGSEL_AES | OP_ALG_AAI_CTR_MOD128, -- .class2_alg_type = OP_ALG_ALGSEL_SHA512 | -- OP_ALG_AAI_HMAC_PRECOMP, -- .alg_op = OP_ALG_ALGSEL_SHA512 | OP_ALG_AAI_HMAC, -- }, -- { -- .name = "rfc4106(gcm(aes))", -- .driver_name = "rfc4106-gcm-aes-caam", -- .blocksize = 1, -- .type = CRYPTO_ALG_TYPE_AEAD, -- .template_aead = { -- .setkey = rfc4106_setkey, -- .setauthsize = rfc4106_setauthsize, -- .encrypt = aead_encrypt, -- .decrypt = aead_decrypt, -- .givencrypt = aead_givencrypt, -- .geniv = "", -- .ivsize = 8, -- .maxauthsize = AES_BLOCK_SIZE, -- }, -- .class1_alg_type = OP_ALG_ALGSEL_AES | OP_ALG_AAI_GCM, -- }, -- { -- .name = "rfc4543(gcm(aes))", -- .driver_name = "rfc4543-gcm-aes-caam", -- .blocksize = 1, -- .type = CRYPTO_ALG_TYPE_AEAD, -- 
.template_aead = { -- .setkey = rfc4543_setkey, -- .setauthsize = rfc4543_setauthsize, -- .encrypt = aead_encrypt, -- .decrypt = aead_decrypt, -- .givencrypt = aead_givencrypt, -- .geniv = "", -- .ivsize = 8, -- .maxauthsize = AES_BLOCK_SIZE, -- }, -- .class1_alg_type = OP_ALG_ALGSEL_AES | OP_ALG_AAI_GCM, -- }, -- /* Galois Counter Mode */ -- { -- .name = "gcm(aes)", -- .driver_name = "gcm-aes-caam", -- .blocksize = 1, -- .type = CRYPTO_ALG_TYPE_AEAD, -- .template_aead = { -- .setkey = gcm_setkey, -- .setauthsize = gcm_setauthsize, -- .encrypt = aead_encrypt, -- .decrypt = aead_decrypt, -- .givencrypt = NULL, -- .geniv = "", -- .ivsize = 12, -- .maxauthsize = AES_BLOCK_SIZE, -- }, -- .class1_alg_type = OP_ALG_ALGSEL_AES | OP_ALG_AAI_GCM, - }, -- /* ablkcipher descriptor */ - { - .name = "cbc(aes)", - .driver_name = "cbc-aes-caam", - .blocksize = AES_BLOCK_SIZE, -- .type = CRYPTO_ALG_TYPE_GIVCIPHER, -+ .type = CRYPTO_ALG_TYPE_ABLKCIPHER, - .template_ablkcipher = { - .setkey = ablkcipher_setkey, - .encrypt = ablkcipher_encrypt, - .decrypt = ablkcipher_decrypt, -- .givencrypt = ablkcipher_givencrypt, -- .geniv = "", -+ .geniv = "eseqiv", - .min_keysize = AES_MIN_KEY_SIZE, - .max_keysize = AES_MAX_KEY_SIZE, - .ivsize = AES_BLOCK_SIZE, -@@ -4054,16 +2129,31 @@ - .class1_alg_type = OP_ALG_ALGSEL_AES | OP_ALG_AAI_CBC, - }, - { -+ .name = "ecb(des3_ede)", -+ .driver_name = "ecb-des3-caam", -+ .blocksize = DES3_EDE_BLOCK_SIZE, -+ .type = CRYPTO_ALG_TYPE_ABLKCIPHER, -+ .template_ablkcipher = { -+ .setkey = ablkcipher_setkey, -+ .encrypt = ablkcipher_encrypt, -+ .decrypt = ablkcipher_decrypt, -+ .geniv = "eseqiv", -+ .min_keysize = DES3_EDE_KEY_SIZE, -+ .max_keysize = DES3_EDE_KEY_SIZE, -+ .ivsize = DES3_EDE_BLOCK_SIZE, -+ }, -+ .class1_alg_type = OP_ALG_ALGSEL_3DES | OP_ALG_AAI_ECB, -+ }, -+ { - .name = "cbc(des3_ede)", - .driver_name = "cbc-3des-caam", - .blocksize = DES3_EDE_BLOCK_SIZE, -- .type = CRYPTO_ALG_TYPE_GIVCIPHER, -+ .type = CRYPTO_ALG_TYPE_ABLKCIPHER, - .template_ablkcipher = { - .setkey = ablkcipher_setkey, - .encrypt = ablkcipher_encrypt, - .decrypt = ablkcipher_decrypt, -- .givencrypt = ablkcipher_givencrypt, -- .geniv = "", -+ .geniv = "eseqiv", - .min_keysize = DES3_EDE_KEY_SIZE, - .max_keysize = DES3_EDE_KEY_SIZE, - .ivsize = DES3_EDE_BLOCK_SIZE, -@@ -4074,58 +2164,23 @@ - .name = "cbc(des)", - .driver_name = "cbc-des-caam", - .blocksize = DES_BLOCK_SIZE, -- .type = CRYPTO_ALG_TYPE_GIVCIPHER, -+ .type = CRYPTO_ALG_TYPE_ABLKCIPHER, - .template_ablkcipher = { - .setkey = ablkcipher_setkey, - .encrypt = ablkcipher_encrypt, - .decrypt = ablkcipher_decrypt, -- .givencrypt = ablkcipher_givencrypt, -- .geniv = "", -+ .geniv = "eseqiv", - .min_keysize = DES_KEY_SIZE, - .max_keysize = DES_KEY_SIZE, - .ivsize = DES_BLOCK_SIZE, - }, - .class1_alg_type = OP_ALG_ALGSEL_DES | OP_ALG_AAI_CBC, -- }, -- { -- .name = "ctr(aes)", -- .driver_name = "ctr-aes-caam", -- .blocksize = 1, -- .type = CRYPTO_ALG_TYPE_ABLKCIPHER, -- .template_ablkcipher = { -- .setkey = ablkcipher_setkey, -- .encrypt = ablkcipher_encrypt, -- .decrypt = ablkcipher_decrypt, -- .geniv = "chainiv", -- .min_keysize = AES_MIN_KEY_SIZE, -- .max_keysize = AES_MAX_KEY_SIZE, -- .ivsize = AES_BLOCK_SIZE, -- }, -- .class1_alg_type = OP_ALG_ALGSEL_AES | OP_ALG_AAI_CTR_MOD128, -- }, -- { -- .name = "rfc3686(ctr(aes))", -- .driver_name = "rfc3686-ctr-aes-caam", -- .blocksize = 1, -- .type = CRYPTO_ALG_TYPE_GIVCIPHER, -- .template_ablkcipher = { -- .setkey = ablkcipher_setkey, -- .encrypt = ablkcipher_encrypt, -- .decrypt = 
ablkcipher_decrypt, -- .givencrypt = ablkcipher_givencrypt, -- .geniv = "", -- .min_keysize = AES_MIN_KEY_SIZE + -- CTR_RFC3686_NONCE_SIZE, -- .max_keysize = AES_MAX_KEY_SIZE + -- CTR_RFC3686_NONCE_SIZE, -- .ivsize = CTR_RFC3686_IV_SIZE, -- }, -- .class1_alg_type = OP_ALG_ALGSEL_AES | OP_ALG_AAI_CTR_MOD128, - } - }; - - struct caam_crypto_alg { - struct list_head entry; -+ struct device *ctrldev; - int class1_alg_type; - int class2_alg_type; - int alg_op; -@@ -4138,12 +2193,14 @@ - struct caam_crypto_alg *caam_alg = - container_of(alg, struct caam_crypto_alg, crypto_alg); - struct caam_ctx *ctx = crypto_tfm_ctx(tfm); -+ struct caam_drv_private *priv = dev_get_drvdata(caam_alg->ctrldev); -+ int tgt_jr = atomic_inc_return(&priv->tfm_count); - -- ctx->jrdev = caam_jr_alloc(); -- if (IS_ERR(ctx->jrdev)) { -- pr_err("Job Ring Device allocation for transform failed\n"); -- return PTR_ERR(ctx->jrdev); -- } -+ /* -+ * distribute tfms across job rings to ensure in-order -+ * crypto request processing per tfm -+ */ -+ ctx->jrdev = priv->algapi_jr[(tgt_jr / 2) % priv->num_jrs_for_algapi]; - - /* copy descriptor header template value */ - ctx->class1_alg_type = OP_TYPE_CLASS1_ALG | caam_alg->class1_alg_type; -@@ -4170,31 +2227,57 @@ - dma_unmap_single(ctx->jrdev, ctx->sh_desc_givenc_dma, - desc_bytes(ctx->sh_desc_givenc), - DMA_TO_DEVICE); -- if (ctx->key_dma && -- !dma_mapping_error(ctx->jrdev, ctx->key_dma)) -- dma_unmap_single(ctx->jrdev, ctx->key_dma, -- ctx->enckeylen + ctx->split_key_pad_len, -- DMA_TO_DEVICE); -- -- caam_jr_free(ctx->jrdev); - } - - static void __exit caam_algapi_exit(void) - { - -+ struct device_node *dev_node; -+ struct platform_device *pdev; -+ struct device *ctrldev; -+ struct caam_drv_private *priv; - struct caam_crypto_alg *t_alg, *n; -+ int i, err; -+ -+ dev_node = of_find_compatible_node(NULL, NULL, "fsl,sec-v4.0"); -+ if (!dev_node) { -+ dev_node = of_find_compatible_node(NULL, NULL, "fsl,sec4.0"); -+ if (!dev_node) -+ return; -+ } -+ -+ pdev = of_find_device_by_node(dev_node); -+ if (!pdev) { -+ of_node_put(dev_node); -+ return; -+ } - -- if (!alg_list.next) -+ ctrldev = &pdev->dev; -+ priv = dev_get_drvdata(ctrldev); -+ -+ if (!priv->alg_list.next) { -+ of_node_put(dev_node); - return; -+ } - -- list_for_each_entry_safe(t_alg, n, &alg_list, entry) { -+ list_for_each_entry_safe(t_alg, n, &priv->alg_list, entry) { - crypto_unregister_alg(&t_alg->crypto_alg); - list_del(&t_alg->entry); - kfree(t_alg); - } -+ -+ for (i = 0; i < priv->total_jobrs; i++) { -+ err = caam_jr_deregister(priv->algapi_jr[i]); -+ if (err < 0) -+ break; -+ } -+ kfree(priv->algapi_jr); -+ -+ of_node_put(dev_node); - } - --static struct caam_crypto_alg *caam_alg_alloc(struct caam_alg_template -+static struct caam_crypto_alg *caam_alg_alloc(struct device *ctrldev, -+ struct caam_alg_template - *template) - { - struct caam_crypto_alg *t_alg; -@@ -4202,7 +2285,7 @@ - - t_alg = kzalloc(sizeof(struct caam_crypto_alg), GFP_KERNEL); - if (!t_alg) { -- pr_err("failed to allocate t_alg\n"); -+ dev_err(ctrldev, "failed to allocate t_alg\n"); - return ERR_PTR(-ENOMEM); - } - -@@ -4218,13 +2301,13 @@ - alg->cra_blocksize = template->blocksize; - alg->cra_alignmask = 0; - alg->cra_ctxsize = sizeof(struct caam_ctx); -- alg->cra_flags = CRYPTO_ALG_ASYNC | CRYPTO_ALG_KERN_DRIVER_ONLY | -- template->type; -+ alg->cra_flags = CRYPTO_ALG_ASYNC | template->type; -+ -+#ifdef CRYPTO_ALG_KERN_DRIVER_ONLY -+ alg->cra_flags |= CRYPTO_ALG_KERN_DRIVER_ONLY; -+#endif -+ - switch (template->type) { -- case 
CRYPTO_ALG_TYPE_GIVCIPHER: -- alg->cra_type = &crypto_givcipher_type; -- alg->cra_ablkcipher = template->template_ablkcipher; -- break; - case CRYPTO_ALG_TYPE_ABLKCIPHER: - alg->cra_type = &crypto_ablkcipher_type; - alg->cra_ablkcipher = template->template_ablkcipher; -@@ -4238,6 +2321,7 @@ - t_alg->class1_alg_type = template->class1_alg_type; - t_alg->class2_alg_type = template->class2_alg_type; - t_alg->alg_op = template->alg_op; -+ t_alg->ctrldev = ctrldev; - - return t_alg; - } -@@ -4246,9 +2330,11 @@ - { - struct device_node *dev_node; - struct platform_device *pdev; -- struct device *ctrldev; -- void *priv; -- int i = 0, err = 0; -+ struct device *ctrldev, **jrdev; -+ struct caam_drv_private *priv; -+ int i = 0, err = 0, md_limit = 0; -+ int des_inst, aes_inst, md_inst; -+ u64 cha_inst; - - dev_node = of_find_compatible_node(NULL, NULL, "fsl,sec-v4.0"); - if (!dev_node) { -@@ -4265,42 +2351,117 @@ - - ctrldev = &pdev->dev; - priv = dev_get_drvdata(ctrldev); -- of_node_put(dev_node); - -- /* -- * If priv is NULL, it's probably because the caam driver wasn't -- * properly initialized (e.g. RNG4 init failed). Thus, bail out here. -- */ -- if (!priv) -- return -ENODEV; -+ INIT_LIST_HEAD(&priv->alg_list); -+ -+ jrdev = kmalloc(sizeof(*jrdev) * priv->total_jobrs, GFP_ATOMIC); -+ if (!jrdev) { -+ of_node_put(dev_node); -+ return -ENOMEM; -+ } - -+ for (i = 0; i < priv->total_jobrs; i++) { -+ err = caam_jr_register(ctrldev, &jrdev[i]); -+ if (err < 0) -+ break; -+ } -+ if (err < 0 && i == 0) { -+ dev_err(ctrldev, "algapi error in job ring registration: %d\n", -+ err); -+ of_node_put(dev_node); -+ kfree(jrdev); -+ return err; -+ } - -- INIT_LIST_HEAD(&alg_list); -+ priv->num_jrs_for_algapi = i; -+ priv->algapi_jr = jrdev; -+ atomic_set(&priv->tfm_count, -1); -+ -+ /* -+ * register crypto algorithms the device supports -+ * first, detect presence of DES, AES, and MD blocks. If MD present, -+ * determine limit of supported digest size -+ */ -+ cha_inst = rd_reg64(&priv->ctrl->perfmon.cha_num); -+ des_inst = (cha_inst & CHA_ID_DES_MASK) >> CHA_ID_DES_SHIFT; -+ aes_inst = (cha_inst & CHA_ID_AES_MASK) >> CHA_ID_AES_SHIFT; -+ md_inst = (cha_inst & CHA_ID_MD_MASK) >> CHA_ID_MD_SHIFT; -+ if (md_inst) { -+ md_limit = SHA512_DIGEST_SIZE; -+ if ((rd_reg64(&priv->ctrl->perfmon.cha_id) & CHA_ID_MD_MASK) -+ == CHA_ID_MD_LP256) /* LP256 limits digest size */ -+ md_limit = SHA256_DIGEST_SIZE; -+ } - -- /* register crypto algorithms the device supports */ - for (i = 0; i < ARRAY_SIZE(driver_algs); i++) { -- /* TODO: check if h/w supports alg */ - struct caam_crypto_alg *t_alg; -+ bool done = false; -+ -+authencesn: -+ /* -+ * All registrable algs in this module require a blockcipher -+ * All aead algs require message digests, so check them for -+ * instantiation and size. 
-+ */ -+ if (driver_algs[i].type == CRYPTO_ALG_TYPE_AEAD) { -+ /* If no MD instantiated, or MD too small, skip */ -+ if ((!md_inst) || -+ (driver_algs[i].template_aead.maxauthsize > -+ md_limit)) -+ continue; -+ } -+ /* If DES alg, and CHA not instantiated, skip */ -+ if ((driver_algs[i].class1_alg_type & OP_ALG_ALGSEL_3DES) || -+ (driver_algs[i].class1_alg_type & OP_ALG_ALGSEL_DES)) -+ if (!des_inst) -+ continue; -+ /* If AES alg, and CHA not instantiated, skip */ -+ if (driver_algs[i].class1_alg_type & OP_ALG_ALGSEL_AES) -+ if (!aes_inst) -+ continue; - -- t_alg = caam_alg_alloc(&driver_algs[i]); -+ t_alg = caam_alg_alloc(ctrldev, &driver_algs[i]); - if (IS_ERR(t_alg)) { - err = PTR_ERR(t_alg); -- pr_warn("%s alg allocation failed\n", -- driver_algs[i].driver_name); -+ dev_warn(ctrldev, "%s alg allocation failed\n", -+ driver_algs[i].driver_name); - continue; - } - - err = crypto_register_alg(&t_alg->crypto_alg); - if (err) { -- pr_warn("%s alg registration failed\n", -+ dev_warn(ctrldev, "%s alg registration failed\n", - t_alg->crypto_alg.cra_driver_name); - kfree(t_alg); -- } else -- list_add_tail(&t_alg->entry, &alg_list); -+ } else { -+ list_add_tail(&t_alg->entry, &priv->alg_list); -+ dev_info(ctrldev, "%s\n", -+ t_alg->crypto_alg.cra_driver_name); -+ -+ if (driver_algs[i].type == CRYPTO_ALG_TYPE_AEAD && -+ !memcmp(driver_algs[i].name, "authenc", 7) && -+ !done) { -+ char *name; -+ -+ name = driver_algs[i].name; -+ memmove(name + 10, name + 7, strlen(name) - 7); -+ memcpy(name + 7, "esn", 3); -+ -+ name = driver_algs[i].driver_name; -+ memmove(name + 10, name + 7, strlen(name) - 7); -+ memcpy(name + 7, "esn", 3); -+ -+ done = true; -+ goto authencesn; -+ } -+ } - } -- if (!list_empty(&alg_list)) -- pr_info("caam algorithms registered in /proc/crypto\n"); - -+ if (!list_empty(&priv->alg_list)) -+ dev_info(ctrldev, "%s algorithms registered in /proc/crypto\n", -+ (char *)of_get_property(dev_node, "compatible", NULL)); -+ -+ of_node_put(dev_node); - return err; - } - -diff -Nur linux-4.1.3/drivers/crypto/caam/caamhash.c linux-xbian-imx6/drivers/crypto/caam/caamhash.c ---- linux-4.1.3/drivers/crypto/caam/caamhash.c 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/drivers/crypto/caam/caamhash.c 2015-07-27 23:13:04.209961631 +0200 -@@ -1,7 +1,7 @@ - /* - * caam - Freescale FSL CAAM support for ahash functions of crypto API - * -- * Copyright 2011 Freescale Semiconductor, Inc. -+ * Copyright (C) 2011-2013 Freescale Semiconductor, Inc. - * - * Based on caamalg.c crypto API driver. - * -@@ -62,6 +62,7 @@ - #include "error.h" - #include "sg_sw_sec4.h" - #include "key_gen.h" -+#include - - #define CAAM_CRA_PRIORITY 3000 - -@@ -72,6 +73,8 @@ - #define CAAM_MAX_HASH_DIGEST_SIZE SHA512_DIGEST_SIZE - - /* length of descriptors text */ -+#define DESC_JOB_IO_LEN (CAAM_CMD_SZ * 5 + CAAM_PTR_SZ * 3) -+ - #define DESC_AHASH_BASE (4 * CAAM_CMD_SZ) - #define DESC_AHASH_UPDATE_LEN (6 * CAAM_CMD_SZ) - #define DESC_AHASH_UPDATE_FIRST_LEN (DESC_AHASH_BASE + 4 * CAAM_CMD_SZ) -@@ -89,14 +92,13 @@ - - #ifdef DEBUG - /* for print_hex_dumps with line references */ -+#define xstr(s) str(s) -+#define str(s) #s - #define debug(format, arg...) printk(format, arg) - #else - #define debug(format, arg...) 
- #endif - -- --static struct list_head hash_list; -- - /* ahash per-session context */ - struct caam_hash_ctx { - struct device *jrdev; -@@ -115,6 +117,7 @@ - u8 key[CAAM_MAX_HASH_KEY_SIZE]; - dma_addr_t key_dma; - int ctx_len; -+ unsigned int key_len; - unsigned int split_key_len; - unsigned int split_key_pad_len; - }; -@@ -137,20 +140,13 @@ - /* Common job descriptor seq in/out ptr routines */ - - /* Map state->caam_ctx, and append seq_out_ptr command that points to it */ --static inline int map_seq_out_ptr_ctx(u32 *desc, struct device *jrdev, -- struct caam_hash_state *state, -- int ctx_len) -+static inline void map_seq_out_ptr_ctx(u32 *desc, struct device *jrdev, -+ struct caam_hash_state *state, -+ int ctx_len) - { - state->ctx_dma = dma_map_single(jrdev, state->caam_ctx, - ctx_len, DMA_FROM_DEVICE); -- if (dma_mapping_error(jrdev, state->ctx_dma)) { -- dev_err(jrdev, "unable to map ctx\n"); -- return -ENOMEM; -- } -- - append_seq_out_ptr(desc, state->ctx_dma, ctx_len, 0); -- -- return 0; - } - - /* Map req->result, and append seq_out_ptr command that points to it */ -@@ -173,6 +169,7 @@ - dma_addr_t buf_dma; - - buf_dma = dma_map_single(jrdev, buf, buflen, DMA_TO_DEVICE); -+ dma_sync_single_for_device(jrdev, buf_dma, buflen, DMA_TO_DEVICE); - dma_to_sec4_sg_one(sec4_sg, buf_dma, buflen, 0); - - return buf_dma; -@@ -208,19 +205,17 @@ - } - - /* Map state->caam_ctx, and add it to link table */ --static inline int ctx_map_to_sec4_sg(u32 *desc, struct device *jrdev, -- struct caam_hash_state *state, int ctx_len, -- struct sec4_sg_entry *sec4_sg, u32 flag) -+static inline void ctx_map_to_sec4_sg(u32 *desc, struct device *jrdev, -+ struct caam_hash_state *state, -+ int ctx_len, -+ struct sec4_sg_entry *sec4_sg, -+ u32 flag) - { - state->ctx_dma = dma_map_single(jrdev, state->caam_ctx, ctx_len, flag); -- if (dma_mapping_error(jrdev, state->ctx_dma)) { -- dev_err(jrdev, "unable to map ctx\n"); -- return -ENOMEM; -- } -- -+ if ((flag == DMA_TO_DEVICE) || (flag == DMA_BIDIRECTIONAL)) -+ dma_sync_single_for_device(jrdev, state->ctx_dma, ctx_len, -+ flag); - dma_to_sec4_sg_one(sec4_sg, state->ctx_dma, ctx_len, 0); -- -- return 0; - } - - /* Common shared descriptor commands */ -@@ -231,6 +226,13 @@ - KEY_DEST_MDHA_SPLIT | KEY_ENC); - } - -+static inline void append_key_axcbc(u32 *desc, struct caam_hash_ctx *ctx) -+{ -+ append_key_as_imm(desc, ctx->key, ctx->key_len, -+ ctx->key_len, CLASS_1 | -+ KEY_DEST_CLASS_REG); -+} -+ - /* Append key if it has been set */ - static inline void init_sh_desc_key_ahash(u32 *desc, struct caam_hash_ctx *ctx) - { -@@ -252,6 +254,25 @@ - append_cmd(desc, SET_OK_NO_PROP_ERRORS | CMD_LOAD); - } - -+static inline void init_sh_desc_key_axcbc(u32 *desc, struct caam_hash_ctx *ctx) -+{ -+ u32 *key_jump_cmd; -+ -+ init_sh_desc(desc, HDR_SHARE_SERIAL); -+ -+ if (ctx->key_len) { -+ key_jump_cmd = append_jump(desc, JUMP_JSL | JUMP_TEST_ALL | -+ JUMP_COND_SHRD); -+ -+ append_key_axcbc(desc, ctx); -+ -+ set_jump_tgt_here(desc, key_jump_cmd); -+ } -+ -+ /* Propagate errors from shared to job descriptor */ -+ append_cmd(desc, SET_OK_NO_PROP_ERRORS | CMD_LOAD); -+ -+} - /* - * For ahash read data from seqin following state->caam_ctx, - * and write resulting class2 context to seqout, which may be state->caam_ctx -@@ -271,6 +292,20 @@ - LDST_SRCDST_BYTE_CONTEXT); - } - -+static inline void axcbc_append_load_str(u32 *desc, int digestsize) -+{ -+ /* Calculate remaining bytes to read */ -+ append_math_add(desc, VARSEQINLEN, SEQINLEN, REG0, CAAM_CMD_SZ); -+ -+ /* Read remaining bytes 
*/ -+ append_seq_fifo_load(desc, 0, FIFOLD_CLASS_CLASS1 | FIFOLD_TYPE_LAST1 | -+ FIFOLD_TYPE_MSG | KEY_VLF); -+ -+ /* Store class1 context bytes */ -+ append_seq_store(desc, digestsize, LDST_CLASS_1_CCB | -+ LDST_SRCDST_BYTE_CONTEXT); -+} -+ - /* - * For ahash update, final and finup, import context, read and write to seqout - */ -@@ -293,6 +328,27 @@ - ahash_append_load_str(desc, digestsize); - } - -+/* -+ * For ahash update, final and finup, import context, read and write to seqout -+ */ -+static inline void axcbc_ctx_data_to_out(u32 *desc, u32 op, u32 state, -+ int digestsize, -+ struct caam_hash_ctx *ctx) -+{ -+ init_sh_desc_key_axcbc(desc, ctx); -+ -+ /* Import context from software */ -+ append_cmd(desc, CMD_SEQ_LOAD | LDST_SRCDST_BYTE_CONTEXT | -+ LDST_CLASS_1_CCB | ctx->ctx_len); -+ -+ /* Class 1 operation */ -+ append_operation(desc, op | state | OP_ALG_ENCRYPT); -+ -+ /* -+ * Load from buf and/or src and write to req->result or state->context -+ */ -+ axcbc_append_load_str(desc, digestsize); -+} - /* For ahash firsts and digest, read and write to seqout */ - static inline void ahash_data_to_out(u32 *desc, u32 op, u32 state, - int digestsize, struct caam_hash_ctx *ctx) -@@ -308,6 +364,21 @@ - ahash_append_load_str(desc, digestsize); - } - -+/* For ahash firsts and digest, read and write to seqout */ -+static inline void axcbc_data_to_out(u32 *desc, u32 op, u32 state, -+ int digestsize, struct caam_hash_ctx *ctx) -+{ -+ init_sh_desc_key_axcbc(desc, ctx); -+ -+ /* Class 1 operation */ -+ append_operation(desc, op | state | OP_ALG_ENCRYPT); -+ -+ /* -+ * Load from buf and/or src and write to req->result or state->context -+ */ -+ axcbc_append_load_str(desc, digestsize); -+} -+ - static int ahash_set_sh_desc(struct crypto_ahash *ahash) - { - struct caam_hash_ctx *ctx = crypto_ahash_ctx(ahash); -@@ -342,8 +413,7 @@ - return -ENOMEM; - } - #ifdef DEBUG -- print_hex_dump(KERN_ERR, -- "ahash update shdesc@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "ahash update shdesc@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, desc, desc_bytes(desc), 1); - #endif - -@@ -361,10 +431,11 @@ - return -ENOMEM; - } - #ifdef DEBUG -- print_hex_dump(KERN_ERR, -- "ahash update first shdesc@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "ahash update first shdesc@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, desc, desc_bytes(desc), 1); - #endif -+ dma_sync_single_for_device(jrdev, ctx->sh_desc_update_first_dma, -+ desc_bytes(desc), DMA_TO_DEVICE); - - /* ahash_final shared descriptor */ - desc = ctx->sh_desc_fin; -@@ -379,10 +450,12 @@ - return -ENOMEM; - } - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "ahash final shdesc@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "ahash final shdesc@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, desc, - desc_bytes(desc), 1); - #endif -+ dma_sync_single_for_device(jrdev, ctx->sh_desc_fin_dma, -+ desc_bytes(desc), DMA_TO_DEVICE); - - /* ahash_finup shared descriptor */ - desc = ctx->sh_desc_finup; -@@ -397,10 +470,12 @@ - return -ENOMEM; - } - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "ahash finup shdesc@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "ahash finup shdesc@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, desc, - desc_bytes(desc), 1); - #endif -+ dma_sync_single_for_device(jrdev, ctx->sh_desc_finup_dma, -+ desc_bytes(desc), DMA_TO_DEVICE); - - /* ahash_digest shared descriptor */ - desc = ctx->sh_desc_digest; -@@ -416,15 +491,134 @@ - return -ENOMEM; - } - #ifdef DEBUG -- print_hex_dump(KERN_ERR, -- "ahash 
digest shdesc@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "ahash digest shdesc@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, desc, - desc_bytes(desc), 1); - #endif -+ dma_sync_single_for_device(jrdev, ctx->sh_desc_digest_dma, -+ desc_bytes(desc), DMA_TO_DEVICE); - - return 0; - } - -+static int axcbc_set_sh_desc(struct crypto_ahash *ahash) -+{ -+ struct caam_hash_ctx *ctx = crypto_ahash_ctx(ahash); -+ int digestsize = crypto_ahash_digestsize(ahash); -+ struct device *jrdev = ctx->jrdev; -+ u32 have_key = 0; -+ u32 *desc; -+ -+ /* ahash_update shared descriptor */ -+ desc = ctx->sh_desc_update; -+ -+ init_sh_desc(desc, HDR_SHARE_SERIAL); -+ -+ /* Import context from software */ -+ append_cmd(desc, CMD_SEQ_LOAD | LDST_SRCDST_BYTE_CONTEXT | -+ LDST_CLASS_1_CCB | ctx->ctx_len); -+ -+ /* Class 1 operation */ -+ append_operation(desc, ctx->alg_type | OP_ALG_AS_UPDATE | -+ OP_ALG_ENCRYPT); -+ -+ /* Load data and write to result or context */ -+ axcbc_append_load_str(desc, ctx->ctx_len); -+ -+ ctx->sh_desc_update_dma = dma_map_single(jrdev, desc, desc_bytes(desc), -+ DMA_TO_DEVICE); -+ if (dma_mapping_error(jrdev, ctx->sh_desc_update_dma)) { -+ dev_err(jrdev, "unable to map shared descriptor\n"); -+ return -ENOMEM; -+ } -+#ifdef DEBUG -+ print_hex_dump(KERN_ERR, "ahash update shdesc@"xstr(__LINE__)": ", -+ DUMP_PREFIX_ADDRESS, 16, 4, desc, desc_bytes(desc), 1); -+#endif -+ -+ /* ahash_update_first shared descriptor */ -+ desc = ctx->sh_desc_update_first; -+ -+ axcbc_data_to_out(desc, have_key | ctx->alg_type, OP_ALG_AS_INIT, -+ ctx->ctx_len, ctx); -+ -+ ctx->sh_desc_update_first_dma = dma_map_single(jrdev, desc, -+ desc_bytes(desc), -+ DMA_TO_DEVICE); -+ if (dma_mapping_error(jrdev, ctx->sh_desc_update_first_dma)) { -+ dev_err(jrdev, "unable to map shared descriptor\n"); -+ return -ENOMEM; -+ } -+#ifdef DEBUG -+ print_hex_dump(KERN_ERR, "ahash update first shdesc@"xstr(__LINE__)": ", -+ DUMP_PREFIX_ADDRESS, 16, 4, desc, desc_bytes(desc), 1); -+#endif -+ dma_sync_single_for_device(jrdev, ctx->sh_desc_update_first_dma, -+ desc_bytes(desc), DMA_TO_DEVICE); -+ -+ /* ahash_final shared descriptor */ -+ desc = ctx->sh_desc_fin; -+ -+ axcbc_ctx_data_to_out(desc, have_key | ctx->alg_type, -+ OP_ALG_AS_FINALIZE, digestsize, ctx); -+ -+ ctx->sh_desc_fin_dma = dma_map_single(jrdev, desc, desc_bytes(desc), -+ DMA_TO_DEVICE); -+ if (dma_mapping_error(jrdev, ctx->sh_desc_fin_dma)) { -+ dev_err(jrdev, "unable to map shared descriptor\n"); -+ return -ENOMEM; -+ } -+#ifdef DEBUG -+ print_hex_dump(KERN_ERR, "ahash final shdesc@"xstr(__LINE__)": ", -+ DUMP_PREFIX_ADDRESS, 16, 4, desc, -+ desc_bytes(desc), 1); -+#endif -+ dma_sync_single_for_device(jrdev, ctx->sh_desc_fin_dma, -+ desc_bytes(desc), DMA_TO_DEVICE); -+ -+ /* ahash_finup shared descriptor */ -+ desc = ctx->sh_desc_finup; -+ -+ axcbc_ctx_data_to_out(desc, have_key | ctx->alg_type, -+ OP_ALG_AS_FINALIZE, digestsize, ctx); -+ -+ ctx->sh_desc_finup_dma = dma_map_single(jrdev, desc, desc_bytes(desc), -+ DMA_TO_DEVICE); -+ if (dma_mapping_error(jrdev, ctx->sh_desc_finup_dma)) { -+ dev_err(jrdev, "unable to map shared descriptor\n"); -+ return -ENOMEM; -+ } -+#ifdef DEBUG -+ print_hex_dump(KERN_ERR, "ahash finup shdesc@"xstr(__LINE__)": ", -+ DUMP_PREFIX_ADDRESS, 16, 4, desc, -+ desc_bytes(desc), 1); -+#endif -+ dma_sync_single_for_device(jrdev, ctx->sh_desc_finup_dma, -+ desc_bytes(desc), DMA_TO_DEVICE); -+ -+ /* ahash_digest shared descriptor */ -+ desc = ctx->sh_desc_digest; -+ -+ axcbc_data_to_out(desc, have_key | ctx->alg_type, 
OP_ALG_AS_INITFINAL, -+ digestsize, ctx); -+ -+ ctx->sh_desc_digest_dma = dma_map_single(jrdev, desc, -+ desc_bytes(desc), -+ DMA_TO_DEVICE); -+ if (dma_mapping_error(jrdev, ctx->sh_desc_digest_dma)) { -+ dev_err(jrdev, "unable to map shared descriptor\n"); -+ return -ENOMEM; -+ } -+#ifdef DEBUG -+ print_hex_dump(KERN_ERR, "ahash digest shdesc@"xstr(__LINE__)": ", -+ DUMP_PREFIX_ADDRESS, 16, 4, desc, -+ desc_bytes(desc), 1); -+#endif -+ dma_sync_single_for_device(jrdev, ctx->sh_desc_digest_dma, -+ desc_bytes(desc), DMA_TO_DEVICE); -+ -+ return 0; -+} - static int gen_split_hash_key(struct caam_hash_ctx *ctx, const u8 *key_in, - u32 keylen) - { -@@ -458,6 +652,8 @@ - kfree(desc); - return -ENOMEM; - } -+ dma_sync_single_for_device(jrdev, src_dma, *keylen, DMA_TO_DEVICE); -+ - dst_dma = dma_map_single(jrdev, (void *)key_out, digestsize, - DMA_FROM_DEVICE); - if (dma_mapping_error(jrdev, dst_dma)) { -@@ -478,9 +674,9 @@ - LDST_SRCDST_BYTE_CONTEXT); - - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "key_in@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "key_in@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, key_in, *keylen, 1); -- print_hex_dump(KERN_ERR, "jobdesc@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "jobdesc@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, desc, desc_bytes(desc), 1); - #endif - -@@ -493,17 +689,17 @@ - wait_for_completion_interruptible(&result.completion); - ret = result.err; - #ifdef DEBUG -- print_hex_dump(KERN_ERR, -- "digested key@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "digested key@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, key_in, - digestsize, 1); - #endif - } -+ *keylen = digestsize; -+ - dma_unmap_single(jrdev, src_dma, *keylen, DMA_TO_DEVICE); -+ dma_sync_single_for_cpu(jrdev, dst_dma, digestsize, DMA_FROM_DEVICE); - dma_unmap_single(jrdev, dst_dma, digestsize, DMA_FROM_DEVICE); - -- *keylen = digestsize; -- - kfree(desc); - - return ret; -@@ -545,7 +741,7 @@ - #ifdef DEBUG - printk(KERN_ERR "split_key_len %d split_key_pad_len %d\n", - ctx->split_key_len, ctx->split_key_pad_len); -- print_hex_dump(KERN_ERR, "key in @"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "key in @"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, key, keylen, 1); - #endif - -@@ -557,11 +753,14 @@ - DMA_TO_DEVICE); - if (dma_mapping_error(jrdev, ctx->key_dma)) { - dev_err(jrdev, "unable to map key i/o memory\n"); -- ret = -ENOMEM; -- goto map_err; -+ return -ENOMEM; - } -+ -+ dma_sync_single_for_device(jrdev, ctx->key_dma, ctx->split_key_pad_len, -+ DMA_TO_DEVICE); -+ - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "ctx.key@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "ctx.key@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, ctx->key, - ctx->split_key_pad_len, 1); - #endif -@@ -572,7 +771,6 @@ - DMA_TO_DEVICE); - } - --map_err: - kfree(hashed_key); - return ret; - badkey: -@@ -581,6 +779,25 @@ - return -EINVAL; - } - -+static int axcbc_setkey(struct crypto_ahash *ahash, -+ const u8 *key, unsigned int keylen) -+{ -+ struct caam_hash_ctx *ctx = crypto_ahash_ctx(ahash); -+ int ret = 0; -+ -+ ctx->key_len = keylen; -+ memcpy(ctx->key, key, keylen); -+ -+#ifdef DEBUG -+ print_hex_dump(KERN_ERR, "ctx.key@"xstr(__LINE__)": ", -+ DUMP_PREFIX_ADDRESS, 16, 4, ctx->key, -+ ctx->key_len, 1); -+#endif -+ -+ ret = axcbc_set_sh_desc(ahash); -+ -+ return ret; -+} - /* - * ahash_edesc - s/w-extended ahash descriptor - * @dst_dma: physical mapped address of req->result -@@ -608,8 +825,11 @@ - if (edesc->src_nents) - dma_unmap_sg_chained(dev, 
req->src, edesc->src_nents, - DMA_TO_DEVICE, edesc->chained); -- if (edesc->dst_dma) -+ if (edesc->dst_dma) { -+ dma_sync_single_for_cpu(dev, edesc->dst_dma, dst_len, -+ DMA_FROM_DEVICE); - dma_unmap_single(dev, edesc->dst_dma, dst_len, DMA_FROM_DEVICE); -+ } - - if (edesc->sec4_sg_bytes) - dma_unmap_single(dev, edesc->sec4_sg_dma, -@@ -624,8 +844,12 @@ - struct caam_hash_ctx *ctx = crypto_ahash_ctx(ahash); - struct caam_hash_state *state = ahash_request_ctx(req); - -- if (state->ctx_dma) -+ if (state->ctx_dma) { -+ if ((flag == DMA_FROM_DEVICE) || (flag == DMA_BIDIRECTIONAL)) -+ dma_sync_single_for_cpu(dev, state->ctx_dma, -+ ctx->ctx_len, flag); - dma_unmap_single(dev, state->ctx_dma, ctx->ctx_len, flag); -+ } - ahash_unmap(dev, edesc, req, dst_len); - } - -@@ -645,18 +869,21 @@ - - edesc = (struct ahash_edesc *)((char *)desc - - offsetof(struct ahash_edesc, hw_desc)); -- if (err) -- caam_jr_strstatus(jrdev, err); -+ if (err) { -+ char tmp[CAAM_ERROR_STR_MAX]; -+ -+ dev_err(jrdev, "%08x: %s\n", err, caam_jr_strstatus(tmp, err)); -+ } - - ahash_unmap(jrdev, edesc, req, digestsize); - kfree(edesc); - - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "ctx@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "ctx@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, state->caam_ctx, - ctx->ctx_len, 1); - if (req->result) -- print_hex_dump(KERN_ERR, "result@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "result@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, req->result, - digestsize, 1); - #endif -@@ -680,18 +907,21 @@ - - edesc = (struct ahash_edesc *)((char *)desc - - offsetof(struct ahash_edesc, hw_desc)); -- if (err) -- caam_jr_strstatus(jrdev, err); -+ if (err) { -+ char tmp[CAAM_ERROR_STR_MAX]; -+ -+ dev_err(jrdev, "%08x: %s\n", err, caam_jr_strstatus(tmp, err)); -+ } - - ahash_unmap_ctx(jrdev, edesc, req, ctx->ctx_len, DMA_BIDIRECTIONAL); - kfree(edesc); - - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "ctx@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "ctx@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, state->caam_ctx, - ctx->ctx_len, 1); - if (req->result) -- print_hex_dump(KERN_ERR, "result@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "result@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, req->result, - digestsize, 1); - #endif -@@ -715,18 +945,21 @@ - - edesc = (struct ahash_edesc *)((char *)desc - - offsetof(struct ahash_edesc, hw_desc)); -- if (err) -- caam_jr_strstatus(jrdev, err); -+ if (err) { -+ char tmp[CAAM_ERROR_STR_MAX]; - -- ahash_unmap_ctx(jrdev, edesc, req, digestsize, DMA_TO_DEVICE); -+ dev_err(jrdev, "%08x: %s\n", err, caam_jr_strstatus(tmp, err)); -+ } -+ -+ ahash_unmap_ctx(jrdev, edesc, req, digestsize, DMA_FROM_DEVICE); - kfree(edesc); - - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "ctx@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "ctx@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, state->caam_ctx, - ctx->ctx_len, 1); - if (req->result) -- print_hex_dump(KERN_ERR, "result@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "result@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, req->result, - digestsize, 1); - #endif -@@ -750,18 +983,21 @@ - - edesc = (struct ahash_edesc *)((char *)desc - - offsetof(struct ahash_edesc, hw_desc)); -- if (err) -- caam_jr_strstatus(jrdev, err); -+ if (err) { -+ char tmp[CAAM_ERROR_STR_MAX]; -+ -+ dev_err(jrdev, "%08x: %s\n", err, caam_jr_strstatus(tmp, err)); -+ } - -- ahash_unmap_ctx(jrdev, edesc, req, ctx->ctx_len, DMA_FROM_DEVICE); -+ ahash_unmap_ctx(jrdev, edesc, req, 
ctx->ctx_len, DMA_TO_DEVICE); - kfree(edesc); - - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "ctx@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "ctx@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, state->caam_ctx, - ctx->ctx_len, 1); - if (req->result) -- print_hex_dump(KERN_ERR, "result@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "result@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, req->result, - digestsize, 1); - #endif -@@ -807,7 +1043,7 @@ - * allocate space for base edesc and hw desc commands, - * link tables - */ -- edesc = kmalloc(sizeof(struct ahash_edesc) + DESC_JOB_IO_LEN + -+ edesc = kzalloc(sizeof(struct ahash_edesc) + DESC_JOB_IO_LEN + - sec4_sg_bytes, GFP_DMA | flags); - if (!edesc) { - dev_err(jrdev, -@@ -820,11 +1056,12 @@ - edesc->sec4_sg_bytes = sec4_sg_bytes; - edesc->sec4_sg = (void *)edesc + sizeof(struct ahash_edesc) + - DESC_JOB_IO_LEN; -+ edesc->sec4_sg_dma = dma_map_single(jrdev, edesc->sec4_sg, -+ sec4_sg_bytes, -+ DMA_TO_DEVICE); - -- ret = ctx_map_to_sec4_sg(desc, jrdev, state, ctx->ctx_len, -- edesc->sec4_sg, DMA_BIDIRECTIONAL); -- if (ret) -- return ret; -+ ctx_map_to_sec4_sg(desc, jrdev, state, ctx->ctx_len, -+ edesc->sec4_sg, DMA_BIDIRECTIONAL); - - state->buf_dma = try_buf_map_to_sec4_sg(jrdev, - edesc->sec4_sg + 1, -@@ -851,21 +1088,16 @@ - init_job_desc_shared(desc, ptr, sh_len, HDR_SHARE_DEFER | - HDR_REVERSE); - -- edesc->sec4_sg_dma = dma_map_single(jrdev, edesc->sec4_sg, -- sec4_sg_bytes, -- DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, edesc->sec4_sg_dma)) { -- dev_err(jrdev, "unable to map S/G table\n"); -- return -ENOMEM; -- } -- - append_seq_in_ptr(desc, edesc->sec4_sg_dma, ctx->ctx_len + - to_hash, LDST_SGF); - - append_seq_out_ptr(desc, state->ctx_dma, ctx->ctx_len, 0); - -+ dma_sync_single_for_device(jrdev, edesc->sec4_sg_dma, -+ sec4_sg_bytes, DMA_TO_DEVICE); -+ - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "jobdesc@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "jobdesc@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, desc, - desc_bytes(desc), 1); - #endif -@@ -885,9 +1117,9 @@ - *next_buflen = last_buflen; - } - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "buf@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "buf@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, buf, *buflen, 1); -- print_hex_dump(KERN_ERR, "next buf@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "next buf@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, next_buf, - *next_buflen, 1); - #endif -@@ -918,7 +1150,7 @@ - sec4_sg_bytes = (1 + (buflen ? 
1 : 0)) * sizeof(struct sec4_sg_entry); - - /* allocate space for base edesc and hw desc commands, link tables */ -- edesc = kmalloc(sizeof(struct ahash_edesc) + DESC_JOB_IO_LEN + -+ edesc = kzalloc(sizeof(struct ahash_edesc) + DESC_JOB_IO_LEN + - sec4_sg_bytes, GFP_DMA | flags); - if (!edesc) { - dev_err(jrdev, "could not allocate extended descriptor\n"); -@@ -932,37 +1164,29 @@ - edesc->sec4_sg_bytes = sec4_sg_bytes; - edesc->sec4_sg = (void *)edesc + sizeof(struct ahash_edesc) + - DESC_JOB_IO_LEN; -+ edesc->sec4_sg_dma = dma_map_single(jrdev, edesc->sec4_sg, -+ sec4_sg_bytes, DMA_TO_DEVICE); - edesc->src_nents = 0; - -- ret = ctx_map_to_sec4_sg(desc, jrdev, state, ctx->ctx_len, -- edesc->sec4_sg, DMA_TO_DEVICE); -- if (ret) -- return ret; -+ ctx_map_to_sec4_sg(desc, jrdev, state, ctx->ctx_len, edesc->sec4_sg, -+ DMA_TO_DEVICE); - - state->buf_dma = try_buf_map_to_sec4_sg(jrdev, edesc->sec4_sg + 1, - buf, state->buf_dma, buflen, - last_buflen); - (edesc->sec4_sg + sec4_sg_bytes - 1)->len |= SEC4_SG_LEN_FIN; - -- edesc->sec4_sg_dma = dma_map_single(jrdev, edesc->sec4_sg, -- sec4_sg_bytes, DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, edesc->sec4_sg_dma)) { -- dev_err(jrdev, "unable to map S/G table\n"); -- return -ENOMEM; -- } -- - append_seq_in_ptr(desc, edesc->sec4_sg_dma, ctx->ctx_len + buflen, - LDST_SGF); - - edesc->dst_dma = map_seq_out_ptr_result(desc, jrdev, req->result, - digestsize); -- if (dma_mapping_error(jrdev, edesc->dst_dma)) { -- dev_err(jrdev, "unable to map dst\n"); -- return -ENOMEM; -- } -+ -+ dma_sync_single_for_device(jrdev, edesc->sec4_sg_dma, sec4_sg_bytes, -+ DMA_TO_DEVICE); - - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "jobdesc@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "jobdesc@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, desc, desc_bytes(desc), 1); - #endif - -@@ -1005,7 +1229,7 @@ - sizeof(struct sec4_sg_entry); - - /* allocate space for base edesc and hw desc commands, link tables */ -- edesc = kmalloc(sizeof(struct ahash_edesc) + DESC_JOB_IO_LEN + -+ edesc = kzalloc(sizeof(struct ahash_edesc) + DESC_JOB_IO_LEN + - sec4_sg_bytes, GFP_DMA | flags); - if (!edesc) { - dev_err(jrdev, "could not allocate extended descriptor\n"); -@@ -1021,11 +1245,11 @@ - edesc->sec4_sg_bytes = sec4_sg_bytes; - edesc->sec4_sg = (void *)edesc + sizeof(struct ahash_edesc) + - DESC_JOB_IO_LEN; -+ edesc->sec4_sg_dma = dma_map_single(jrdev, edesc->sec4_sg, -+ sec4_sg_bytes, DMA_TO_DEVICE); - -- ret = ctx_map_to_sec4_sg(desc, jrdev, state, ctx->ctx_len, -- edesc->sec4_sg, DMA_TO_DEVICE); -- if (ret) -- return ret; -+ ctx_map_to_sec4_sg(desc, jrdev, state, ctx->ctx_len, edesc->sec4_sg, -+ DMA_TO_DEVICE); - - state->buf_dma = try_buf_map_to_sec4_sg(jrdev, edesc->sec4_sg + 1, - buf, state->buf_dma, buflen, -@@ -1034,25 +1258,17 @@ - src_map_to_sec4_sg(jrdev, req->src, src_nents, edesc->sec4_sg + - sec4_sg_src_index, chained); - -- edesc->sec4_sg_dma = dma_map_single(jrdev, edesc->sec4_sg, -- sec4_sg_bytes, DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, edesc->sec4_sg_dma)) { -- dev_err(jrdev, "unable to map S/G table\n"); -- return -ENOMEM; -- } -- - append_seq_in_ptr(desc, edesc->sec4_sg_dma, ctx->ctx_len + - buflen + req->nbytes, LDST_SGF); - - edesc->dst_dma = map_seq_out_ptr_result(desc, jrdev, req->result, - digestsize); -- if (dma_mapping_error(jrdev, edesc->dst_dma)) { -- dev_err(jrdev, "unable to map dst\n"); -- return -ENOMEM; -- } -+ -+ dma_sync_single_for_device(jrdev, edesc->sec4_sg_dma, sec4_sg_bytes, -+ DMA_TO_DEVICE); - - #ifdef DEBUG -- 
print_hex_dump(KERN_ERR, "jobdesc@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "jobdesc@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, desc, desc_bytes(desc), 1); - #endif - -@@ -1091,7 +1307,7 @@ - sec4_sg_bytes = src_nents * sizeof(struct sec4_sg_entry); - - /* allocate space for base edesc and hw desc commands, link tables */ -- edesc = kmalloc(sizeof(struct ahash_edesc) + sec4_sg_bytes + -+ edesc = kzalloc(sizeof(struct ahash_edesc) + sec4_sg_bytes + - DESC_JOB_IO_LEN, GFP_DMA | flags); - if (!edesc) { - dev_err(jrdev, "could not allocate extended descriptor\n"); -@@ -1099,6 +1315,8 @@ - } - edesc->sec4_sg = (void *)edesc + sizeof(struct ahash_edesc) + - DESC_JOB_IO_LEN; -+ edesc->sec4_sg_dma = dma_map_single(jrdev, edesc->sec4_sg, -+ sec4_sg_bytes, DMA_TO_DEVICE); - edesc->sec4_sg_bytes = sec4_sg_bytes; - edesc->src_nents = src_nents; - edesc->chained = chained; -@@ -1109,12 +1327,6 @@ - - if (src_nents) { - sg_to_sec4_sg_last(req->src, src_nents, edesc->sec4_sg, 0); -- edesc->sec4_sg_dma = dma_map_single(jrdev, edesc->sec4_sg, -- sec4_sg_bytes, DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, edesc->sec4_sg_dma)) { -- dev_err(jrdev, "unable to map S/G table\n"); -- return -ENOMEM; -- } - src_dma = edesc->sec4_sg_dma; - options = LDST_SGF; - } else { -@@ -1123,15 +1335,14 @@ - } - append_seq_in_ptr(desc, src_dma, req->nbytes, options); - -+ dma_sync_single_for_device(jrdev, edesc->sec4_sg_dma, -+ edesc->sec4_sg_bytes, DMA_TO_DEVICE); -+ - edesc->dst_dma = map_seq_out_ptr_result(desc, jrdev, req->result, - digestsize); -- if (dma_mapping_error(jrdev, edesc->dst_dma)) { -- dev_err(jrdev, "unable to map dst\n"); -- return -ENOMEM; -- } - - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "jobdesc@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "jobdesc@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, desc, desc_bytes(desc), 1); - #endif - -@@ -1165,7 +1376,7 @@ - int sh_len; - - /* allocate space for base edesc and hw desc commands, link tables */ -- edesc = kmalloc(sizeof(struct ahash_edesc) + DESC_JOB_IO_LEN, -+ edesc = kzalloc(sizeof(struct ahash_edesc) + DESC_JOB_IO_LEN, - GFP_DMA | flags); - if (!edesc) { - dev_err(jrdev, "could not allocate extended descriptor\n"); -@@ -1178,23 +1389,17 @@ - init_job_desc_shared(desc, ptr, sh_len, HDR_SHARE_DEFER | HDR_REVERSE); - - state->buf_dma = dma_map_single(jrdev, buf, buflen, DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, state->buf_dma)) { -- dev_err(jrdev, "unable to map src\n"); -- return -ENOMEM; -- } - - append_seq_in_ptr(desc, state->buf_dma, buflen, 0); - - edesc->dst_dma = map_seq_out_ptr_result(desc, jrdev, req->result, - digestsize); -- if (dma_mapping_error(jrdev, edesc->dst_dma)) { -- dev_err(jrdev, "unable to map dst\n"); -- return -ENOMEM; -- } - edesc->src_nents = 0; - -+ dma_sync_single_for_device(jrdev, state->buf_dma, buflen, -+ DMA_TO_DEVICE); - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "jobdesc@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "jobdesc@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, desc, desc_bytes(desc), 1); - #endif - -@@ -1245,7 +1450,7 @@ - * allocate space for base edesc and hw desc commands, - * link tables - */ -- edesc = kmalloc(sizeof(struct ahash_edesc) + DESC_JOB_IO_LEN + -+ edesc = kzalloc(sizeof(struct ahash_edesc) + DESC_JOB_IO_LEN + - sec4_sg_bytes, GFP_DMA | flags); - if (!edesc) { - dev_err(jrdev, -@@ -1258,7 +1463,9 @@ - edesc->sec4_sg_bytes = sec4_sg_bytes; - edesc->sec4_sg = (void *)edesc + sizeof(struct ahash_edesc) + - DESC_JOB_IO_LEN; -- edesc->dst_dma = 
0; -+ edesc->sec4_sg_dma = dma_map_single(jrdev, edesc->sec4_sg, -+ sec4_sg_bytes, -+ DMA_TO_DEVICE); - - state->buf_dma = buf_map_to_sec4_sg(jrdev, edesc->sec4_sg, - buf, *buflen); -@@ -1276,22 +1483,14 @@ - init_job_desc_shared(desc, ptr, sh_len, HDR_SHARE_DEFER | - HDR_REVERSE); - -- edesc->sec4_sg_dma = dma_map_single(jrdev, edesc->sec4_sg, -- sec4_sg_bytes, -- DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, edesc->sec4_sg_dma)) { -- dev_err(jrdev, "unable to map S/G table\n"); -- return -ENOMEM; -- } -- - append_seq_in_ptr(desc, edesc->sec4_sg_dma, to_hash, LDST_SGF); - -- ret = map_seq_out_ptr_ctx(desc, jrdev, state, ctx->ctx_len); -- if (ret) -- return ret; -+ map_seq_out_ptr_ctx(desc, jrdev, state, ctx->ctx_len); - -+ dma_sync_single_for_device(jrdev, edesc->sec4_sg_dma, -+ sec4_sg_bytes, DMA_TO_DEVICE); - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "jobdesc@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "jobdesc@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, desc, - desc_bytes(desc), 1); - #endif -@@ -1314,9 +1513,9 @@ - *next_buflen = 0; - } - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "buf@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "buf@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, buf, *buflen, 1); -- print_hex_dump(KERN_ERR, "next buf@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "next buf@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, next_buf, - *next_buflen, 1); - #endif -@@ -1352,7 +1551,7 @@ - sizeof(struct sec4_sg_entry); - - /* allocate space for base edesc and hw desc commands, link tables */ -- edesc = kmalloc(sizeof(struct ahash_edesc) + DESC_JOB_IO_LEN + -+ edesc = kzalloc(sizeof(struct ahash_edesc) + DESC_JOB_IO_LEN + - sec4_sg_bytes, GFP_DMA | flags); - if (!edesc) { - dev_err(jrdev, "could not allocate extended descriptor\n"); -@@ -1368,6 +1567,8 @@ - edesc->sec4_sg_bytes = sec4_sg_bytes; - edesc->sec4_sg = (void *)edesc + sizeof(struct ahash_edesc) + - DESC_JOB_IO_LEN; -+ edesc->sec4_sg_dma = dma_map_single(jrdev, edesc->sec4_sg, -+ sec4_sg_bytes, DMA_TO_DEVICE); - - state->buf_dma = try_buf_map_to_sec4_sg(jrdev, edesc->sec4_sg, buf, - state->buf_dma, buflen, -@@ -1376,25 +1577,17 @@ - src_map_to_sec4_sg(jrdev, req->src, src_nents, edesc->sec4_sg + 1, - chained); - -- edesc->sec4_sg_dma = dma_map_single(jrdev, edesc->sec4_sg, -- sec4_sg_bytes, DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, edesc->sec4_sg_dma)) { -- dev_err(jrdev, "unable to map S/G table\n"); -- return -ENOMEM; -- } -- - append_seq_in_ptr(desc, edesc->sec4_sg_dma, buflen + - req->nbytes, LDST_SGF); - - edesc->dst_dma = map_seq_out_ptr_result(desc, jrdev, req->result, - digestsize); -- if (dma_mapping_error(jrdev, edesc->dst_dma)) { -- dev_err(jrdev, "unable to map dst\n"); -- return -ENOMEM; -- } -+ -+ dma_sync_single_for_device(jrdev, edesc->sec4_sg_dma, sec4_sg_bytes, -+ DMA_TO_DEVICE); - - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "jobdesc@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "jobdesc@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, desc, desc_bytes(desc), 1); - #endif - -@@ -1447,7 +1640,7 @@ - * allocate space for base edesc and hw desc commands, - * link tables - */ -- edesc = kmalloc(sizeof(struct ahash_edesc) + DESC_JOB_IO_LEN + -+ edesc = kzalloc(sizeof(struct ahash_edesc) + DESC_JOB_IO_LEN + - sec4_sg_bytes, GFP_DMA | flags); - if (!edesc) { - dev_err(jrdev, -@@ -1460,19 +1653,13 @@ - edesc->sec4_sg_bytes = sec4_sg_bytes; - edesc->sec4_sg = (void *)edesc + sizeof(struct ahash_edesc) + - DESC_JOB_IO_LEN; -- edesc->dst_dma = 0; 
-+ edesc->sec4_sg_dma = dma_map_single(jrdev, edesc->sec4_sg, -+ sec4_sg_bytes, -+ DMA_TO_DEVICE); - - if (src_nents) { - sg_to_sec4_sg_last(req->src, src_nents, - edesc->sec4_sg, 0); -- edesc->sec4_sg_dma = dma_map_single(jrdev, -- edesc->sec4_sg, -- sec4_sg_bytes, -- DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, edesc->sec4_sg_dma)) { -- dev_err(jrdev, "unable to map S/G table\n"); -- return -ENOMEM; -- } - src_dma = edesc->sec4_sg_dma; - options = LDST_SGF; - } else { -@@ -1491,12 +1678,12 @@ - - append_seq_in_ptr(desc, src_dma, to_hash, options); - -- ret = map_seq_out_ptr_ctx(desc, jrdev, state, ctx->ctx_len); -- if (ret) -- return ret; -+ map_seq_out_ptr_ctx(desc, jrdev, state, ctx->ctx_len); - -+ dma_sync_single_for_device(jrdev, edesc->sec4_sg_dma, -+ sec4_sg_bytes, DMA_TO_DEVICE); - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "jobdesc@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "jobdesc@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, desc, - desc_bytes(desc), 1); - #endif -@@ -1521,7 +1708,7 @@ - req->nbytes, 0); - } - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "next buf@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "next buf@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, next_buf, - *next_buflen, 1); - #endif -@@ -1735,10 +1922,33 @@ - .alg_type = OP_ALG_ALGSEL_MD5, - .alg_op = OP_ALG_ALGSEL_MD5 | OP_ALG_AAI_HMAC, - }, -+ { -+ .name = "xcbc(aes)", -+ .driver_name = "xcbc-aes-caam", -+ .hmac_name = "xcbc(aes)", -+ .hmac_driver_name = "xcbc-aes-caam", -+ .blocksize = XCBC_MAC_BLOCK_WORDS * 4, -+ .template_ahash = { -+ .init = ahash_init, -+ .update = ahash_update, -+ .final = ahash_final, -+ .finup = ahash_finup, -+ .digest = ahash_digest, -+ .export = ahash_export, -+ .import = ahash_import, -+ .setkey = axcbc_setkey, -+ .halg = { -+ .digestsize = XCBC_MAC_DIGEST_SIZE, -+ }, -+ }, -+ .alg_type = OP_ALG_ALGSEL_AES | OP_ALG_AAI_XCBC_MAC, -+ .alg_op = OP_ALG_ALGSEL_AES, -+ }, - }; - - struct caam_hash_alg { - struct list_head entry; -+ struct device *ctrldev; - int alg_type; - int alg_op; - struct ahash_alg ahash_alg; -@@ -1755,6 +1965,7 @@ - struct caam_hash_alg *caam_hash = - container_of(alg, struct caam_hash_alg, ahash_alg); - struct caam_hash_ctx *ctx = crypto_tfm_ctx(tfm); -+ struct caam_drv_private *priv = dev_get_drvdata(caam_hash->ctrldev); - /* Sizes for MDHA running digests: MD5, SHA1, 224, 256, 384, 512 */ - static const u8 runninglen[] = { HASH_MSG_LEN + MD5_DIGEST_SIZE, - HASH_MSG_LEN + SHA1_DIGEST_SIZE, -@@ -1762,17 +1973,15 @@ - HASH_MSG_LEN + SHA256_DIGEST_SIZE, - HASH_MSG_LEN + 64, - HASH_MSG_LEN + SHA512_DIGEST_SIZE }; -+ int tgt_jr = atomic_inc_return(&priv->tfm_count); - int ret = 0; - - /* -- * Get a Job ring from Job Ring driver to ensure in-order -+ * distribute tfms across job rings to ensure in-order - * crypto request processing per tfm - */ -- ctx->jrdev = caam_jr_alloc(); -- if (IS_ERR(ctx->jrdev)) { -- pr_err("Job Ring Device allocation for transform failed\n"); -- return PTR_ERR(ctx->jrdev); -- } -+ ctx->jrdev = priv->jrdev[tgt_jr % priv->total_jobrs]; -+ - /* copy descriptor header template value */ - ctx->alg_type = OP_TYPE_CLASS2_ALG | caam_hash->alg_type; - ctx->alg_op = OP_TYPE_CLASS2_ALG | caam_hash->alg_op; -@@ -1788,6 +1997,39 @@ - return ret; - } - -+static int caam_axcbc_cra_init(struct crypto_tfm *tfm) -+{ -+ struct crypto_ahash *ahash = __crypto_ahash_cast(tfm); -+ struct crypto_alg *base = tfm->__crt_alg; -+ struct hash_alg_common *halg = -+ container_of(base, struct hash_alg_common, base); -+ struct ahash_alg *alg 
= -+ container_of(halg, struct ahash_alg, halg); -+ struct caam_hash_alg *caam_hash = -+ container_of(alg, struct caam_hash_alg, ahash_alg); -+ struct caam_hash_ctx *ctx = crypto_tfm_ctx(tfm); -+ struct caam_drv_private *priv = dev_get_drvdata(caam_hash->ctrldev); -+ int tgt_jr = atomic_inc_return(&priv->tfm_count); -+ int ret = 0; -+ -+ /* -+ * distribute tfms across job rings to ensure in-order -+ * crypto request processing per tfm -+ */ -+ ctx->jrdev = priv->jrdev[tgt_jr % priv->total_jobrs]; -+ -+ /* copy descriptor header template value */ -+ ctx->alg_type = OP_TYPE_CLASS1_ALG | caam_hash->alg_type; -+ ctx->alg_op = OP_TYPE_CLASS1_ALG | caam_hash->alg_op; -+ -+ crypto_ahash_set_reqsize(__crypto_ahash_cast(tfm), -+ sizeof(struct caam_hash_state)); -+ -+ ret = axcbc_set_sh_desc(ahash); -+ -+ return ret; -+} -+ - static void caam_hash_cra_exit(struct crypto_tfm *tfm) - { - struct caam_hash_ctx *ctx = crypto_tfm_ctx(tfm); -@@ -1815,35 +2057,57 @@ - !dma_mapping_error(ctx->jrdev, ctx->sh_desc_finup_dma)) - dma_unmap_single(ctx->jrdev, ctx->sh_desc_finup_dma, - desc_bytes(ctx->sh_desc_finup), DMA_TO_DEVICE); -- -- caam_jr_free(ctx->jrdev); - } - - static void __exit caam_algapi_hash_exit(void) - { -+ struct device_node *dev_node; -+ struct platform_device *pdev; -+ struct device *ctrldev; -+ struct caam_drv_private *priv; - struct caam_hash_alg *t_alg, *n; - -- if (!hash_list.next) -+ dev_node = of_find_compatible_node(NULL, NULL, "fsl,sec-v4.0"); -+ if (!dev_node) { -+ dev_node = of_find_compatible_node(NULL, NULL, "fsl,sec4.0"); -+ if (!dev_node) -+ return; -+ } -+ -+ pdev = of_find_device_by_node(dev_node); -+ if (!pdev) { -+ of_node_put(dev_node); - return; -+ } - -- list_for_each_entry_safe(t_alg, n, &hash_list, entry) { -+ ctrldev = &pdev->dev; -+ priv = dev_get_drvdata(ctrldev); -+ -+ if (!priv->hash_list.next) { -+ of_node_put(dev_node); -+ return; -+ } -+ -+ list_for_each_entry_safe(t_alg, n, &priv->hash_list, entry) { - crypto_unregister_ahash(&t_alg->ahash_alg); - list_del(&t_alg->entry); - kfree(t_alg); - } -+ -+ of_node_put(dev_node); - } - - static struct caam_hash_alg * --caam_hash_alloc(struct caam_hash_template *template, -+caam_hash_alloc(struct device *ctrldev, struct caam_hash_template *template, - bool keyed) - { - struct caam_hash_alg *t_alg; - struct ahash_alg *halg; - struct crypto_alg *alg; - -- t_alg = kzalloc(sizeof(struct caam_hash_alg), GFP_KERNEL); -+ t_alg = kzalloc(sizeof(struct caam_hash_alg), GFP_ATOMIC); - if (!t_alg) { -- pr_err("failed to allocate t_alg\n"); -+ dev_err(ctrldev, "failed to allocate t_alg\n"); - return ERR_PTR(-ENOMEM); - } - -@@ -1863,7 +2127,11 @@ - template->driver_name); - } - alg->cra_module = THIS_MODULE; -- alg->cra_init = caam_hash_cra_init; -+ -+ if (strstr(alg->cra_name, "xcbc") > 0) -+ alg->cra_init = caam_axcbc_cra_init; -+ else -+ alg->cra_init = caam_hash_cra_init; - alg->cra_exit = caam_hash_cra_exit; - alg->cra_ctxsize = sizeof(struct caam_hash_ctx); - alg->cra_priority = CAAM_CRA_PRIORITY; -@@ -1874,6 +2142,7 @@ - - t_alg->alg_type = template->alg_type; - t_alg->alg_op = template->alg_op; -+ t_alg->ctrldev = ctrldev; - - return t_alg; - } -@@ -1883,8 +2152,9 @@ - struct device_node *dev_node; - struct platform_device *pdev; - struct device *ctrldev; -- void *priv; -- int i = 0, err = 0; -+ struct caam_drv_private *priv; -+ int i = 0, err = 0, md_limit = 0, md_inst; -+ u64 cha_inst; - - dev_node = of_find_compatible_node(NULL, NULL, "fsl,sec-v4.0"); - if (!dev_node) { -@@ -1898,60 +2168,68 @@ - of_node_put(dev_node); - 
return -ENODEV; - } -- - ctrldev = &pdev->dev; - priv = dev_get_drvdata(ctrldev); -- of_node_put(dev_node); - -- /* -- * If priv is NULL, it's probably because the caam driver wasn't -- * properly initialized (e.g. RNG4 init failed). Thus, bail out here. -- */ -- if (!priv) -- return -ENODEV; -+ INIT_LIST_HEAD(&priv->hash_list); - -- INIT_LIST_HEAD(&hash_list); -+ atomic_set(&priv->tfm_count, -1); -+ -+ /* register algorithms the device supports */ -+ cha_inst = rd_reg64(&priv->ctrl->perfmon.cha_num); -+ md_inst = (cha_inst & CHA_ID_MD_MASK) >> CHA_ID_MD_SHIFT; -+ if (md_inst) { -+ md_limit = SHA512_DIGEST_SIZE; -+ if ((rd_reg64(&priv->ctrl->perfmon.cha_id) & CHA_ID_MD_MASK) -+ == CHA_ID_MD_LP256) /* LP256 limits digest size */ -+ md_limit = SHA256_DIGEST_SIZE; -+ } - -- /* register crypto algorithms the device supports */ - for (i = 0; i < ARRAY_SIZE(driver_hash); i++) { -- /* TODO: check if h/w supports alg */ - struct caam_hash_alg *t_alg; - -+ /* If no MD instantiated, or MD too small, skip */ -+ if ((!md_inst) || -+ (driver_hash[i].template_ahash.halg.digestsize > -+ md_limit)) -+ continue; -+ - /* register hmac version */ -- t_alg = caam_hash_alloc(&driver_hash[i], true); -+ t_alg = caam_hash_alloc(ctrldev, &driver_hash[i], true); - if (IS_ERR(t_alg)) { - err = PTR_ERR(t_alg); -- pr_warn("%s alg allocation failed\n", -- driver_hash[i].driver_name); -+ dev_warn(ctrldev, "%s alg allocation failed\n", -+ driver_hash[i].driver_name); - continue; - } - - err = crypto_register_ahash(&t_alg->ahash_alg); - if (err) { -- pr_warn("%s alg registration failed\n", -+ dev_warn(ctrldev, "%s alg registration failed\n", - t_alg->ahash_alg.halg.base.cra_driver_name); - kfree(t_alg); - } else -- list_add_tail(&t_alg->entry, &hash_list); -+ list_add_tail(&t_alg->entry, &priv->hash_list); - - /* register unkeyed version */ -- t_alg = caam_hash_alloc(&driver_hash[i], false); -+ t_alg = caam_hash_alloc(ctrldev, &driver_hash[i], false); - if (IS_ERR(t_alg)) { - err = PTR_ERR(t_alg); -- pr_warn("%s alg allocation failed\n", -- driver_hash[i].driver_name); -+ dev_warn(ctrldev, "%s alg allocation failed\n", -+ driver_hash[i].driver_name); - continue; - } - - err = crypto_register_ahash(&t_alg->ahash_alg); - if (err) { -- pr_warn("%s alg registration failed\n", -+ dev_warn(ctrldev, "%s alg registration failed\n", - t_alg->ahash_alg.halg.base.cra_driver_name); - kfree(t_alg); - } else -- list_add_tail(&t_alg->entry, &hash_list); -+ list_add_tail(&t_alg->entry, &priv->hash_list); - } - -+ of_node_put(dev_node); - return err; - } - -diff -Nur linux-4.1.3/drivers/crypto/caam/caam_keyblob.c linux-xbian-imx6/drivers/crypto/caam/caam_keyblob.c ---- linux-4.1.3/drivers/crypto/caam/caam_keyblob.c 1970-01-01 01:00:00.000000000 +0100 -+++ linux-xbian-imx6/drivers/crypto/caam/caam_keyblob.c 2015-07-27 23:13:04.205975852 +0200 -@@ -0,0 +1,687 @@ -+/* -+ * Key blob driver based on CAAM hardware -+ * -+ * Copyright (C) 2015 Freescale Semiconductor, Inc. -+ */ -+ -+#include -+#include -+ -+#include "compat.h" -+#include "regs.h" -+#include "jr.h" -+#include "desc.h" -+#include "intern.h" -+#include "sm.h" -+#include "caam_keyblob.h" -+ -+#define INITIAL_DESCSZ 16 /* size of tmp buffer for descriptor const. 
*/ -+ -+/** -+ * struct kb_device - the metadata of the caam key blob device node -+ * @dev: the actual misc device -+ */ -+struct kb_device { -+ struct miscdevice misc_dev; -+ struct device *jr_dev; -+}; -+ -+/* -+ * Pseudo-synchronous ring access functions for carrying out key -+ * encapsulation and decapsulation -+ */ -+ -+struct sm_key_job_result { -+ int error; -+ struct completion completion; -+}; -+ -+ -+static struct kb_device *kb_dev; -+ -+static struct kb_device *kb_device_create(void); -+static int kb_device_destroy(struct kb_device *kb_dev); -+static int kb_open(struct inode *inode, struct file *file); -+static int kb_release(struct inode *inode, struct file *file); -+static void sm_key_job_done(struct device *dev, u32 *desc, -+ u32 err, void *context); -+static int gen_mem_encap(struct device *jr_dev, void __user *secretbuf, -+ int keylen, void __user *kmodbuf, void __user *outbuf); -+static int gen_mem_decap(struct device *jr_dev, void __user *keyblobbuf, -+ int bloblen, void __user *kmodbuf, void __user *outbuf); -+static long kb_ioctl(struct file *file, unsigned int cmd, unsigned long arg); -+static int caam_keyblob_probe(struct platform_device *pdev); -+static int caam_keyblob_remove(struct platform_device *pdev); -+ -+static int kb_open(struct inode *inode, struct file *file) -+{ -+ struct miscdevice *miscdev = file->private_data; -+ struct kb_device *dev = container_of(miscdev, struct kb_device, misc_dev); -+ struct device *jr_dev; -+ -+ if (!dev->jr_dev) { -+ jr_dev = caam_jr_alloc(); -+ if (IS_ERR(jr_dev)) { -+ pr_err("Job Ring Device allocation for transform failed\n"); -+ return -ENOMEM; -+ } -+ pr_info("Allocate a job ring device\n"); -+ dev->jr_dev = jr_dev; -+ } -+ else { -+ pr_err("Already created a job ring device"); -+ return -EPERM; -+ } -+ -+ return 0; -+} -+ -+static int kb_release(struct inode *inode, struct file *file) -+{ -+ struct miscdevice *miscdev = file->private_data; -+ struct kb_device *dev = container_of(miscdev, struct kb_device, misc_dev); -+ -+ if (dev && dev->jr_dev) { -+ caam_jr_free(dev->jr_dev); -+ pr_info("Free a job ring device\n"); -+ dev->jr_dev = NULL; -+ } -+ return 0; -+} -+ -+static void sm_key_job_done(struct device *dev, u32 *desc, -+ u32 err, void *context) -+{ -+ struct sm_key_job_result *res = context; -+ -+ res->error = err; /* save off the error for postprocessing */ -+ complete(&res->completion); /* mark us complete */ -+} -+ -+/* -+ * Construct a blob encapsulation job descriptor -+ * -+ * This function dynamically constructs a blob encapsulation job descriptor -+ * from the following arguments: -+ * -+ * - desc pointer to a pointer to the descriptor generated by this -+ * function. Caller will be responsible to kfree() this -+ * descriptor after execution. -+ * - keymod Physical pointer to a key modifier, which must reside in a -+ * contiguous piece of memory. Modifier will be assumed to be -+ * 8 bytes long for a blob of type SM_SECMEM, or 16 bytes long -+ * for a blob of type SM_GENMEM (see blobtype argument). -+ * - secretbuf Physical pointer to a secret, normally a black or red key, -+ * possibly residing within an accessible secure memory page, -+ * of the secret to be encapsulated to an output blob. -+ * - outbuf Physical pointer to the destination buffer to receive the -+ * encapsulated output. This buffer will need to be 48 bytes -+ * larger than the input because of the added encapsulation data. 
-+ * The generated descriptor will account for the increase in size, -+ * but the caller must also account for this increase in the -+ * buffer allocator. -+ * - secretsz Size of input secret, in bytes. This is limited to 65536 -+ * less the size of blob overhead, since the length embeds into -+ * DECO pointer in/out instructions. -+ * - keycolor Determines if the source data is covered (black key) or -+ * plaintext (red key). RED_KEY or BLACK_KEY are defined in -+ * for this purpose. -+ * - blobtype Determine if encapsulated blob should be a secure memory -+ * blob (SM_SECMEM), with partition data embedded with key -+ * material, or a general memory blob (SM_GENMEM). -+ * - auth If BLACK_KEY source is covered via AES-CCM, specify -+ * KEY_COVER_CCM, else uses AES-ECB (KEY_COVER_ECB). -+ * -+ * Upon completion, desc points to a buffer containing a CAAM job -+ * descriptor which encapsulates data into an externally-storable blob -+ * suitable for use across power cycles. -+ * -+ * This is an example of a black key encapsulation job into a general memory -+ * blob. Notice the 16-byte key modifier in the LOAD instruction. Also note -+ * the output 48 bytes longer than the input: -+ * -+ * [00] B0800008 jobhdr: stidx=0 len=8 -+ * [01] 14400010 ld: ccb2-key len=16 offs=0 -+ * [02] 08144891 ptr->@0x08144891 -+ * [03] F800003A seqoutptr: len=58 -+ * [04] 01000000 out_ptr->@0x01000000 -+ * [05] F000000A seqinptr: len=10 -+ * [06] 09745090 in_ptr->@0x09745090 -+ * [07] 870D0004 operation: encap blob reg=memory, black, format=normal -+ * -+ * This is an example of a red key encapsulation job for storing a red key -+ * into a secure memory blob. Note the 8 byte modifier on the 12 byte offset -+ * in the LOAD instruction; this accounts for blob permission storage: -+ * -+ * [00] B0800008 jobhdr: stidx=0 len=8 -+ * [01] 14400C08 ld: ccb2-key len=8 offs=12 -+ * [02] 087D0784 ptr->@0x087d0784 -+ * [03] F8000050 seqoutptr: len=80 -+ * [04] 09251BB2 out_ptr->@0x09251bb2 -+ * [05] F0000020 seqinptr: len=32 -+ * [06] 40000F31 in_ptr->@0x40000f31 -+ * [07] 870D0008 operation: encap blob reg=memory, red, sec_mem, -+ * format=normal -+ * -+ * Note: this function only generates 32-bit pointers at present, and should -+ * be refactored using a scheme that allows both 32 and 64 bit addressing -+ */ -+ -+static int blob_encap_jobdesc(u32 **desc, dma_addr_t keymod, -+ void *secretbuf, dma_addr_t outbuf, -+ u16 secretsz, u8 keycolor, u8 blobtype, u8 auth) -+{ -+ u32 *tdesc, tmpdesc[INITIAL_DESCSZ]; -+ u16 dsize, idx; -+ -+ memset(tmpdesc, 0, INITIAL_DESCSZ * sizeof(u32)); -+ idx = 1; -+ -+ /* -+ * Key modifier works differently for secure/general memory blobs -+ * This accounts for the permission/protection data encapsulated -+ * within the blob if a secure memory blob is requested -+ */ -+ if (blobtype == SM_SECMEM) -+ tmpdesc[idx++] = CMD_LOAD | LDST_CLASS_2_CCB | -+ LDST_SRCDST_BYTE_KEY | -+ ((12 << LDST_OFFSET_SHIFT) & LDST_OFFSET_MASK) -+ | (8 & LDST_LEN_MASK); -+ else /* is general memory blob */ -+ tmpdesc[idx++] = CMD_LOAD | LDST_CLASS_2_CCB | -+ LDST_SRCDST_BYTE_KEY | (16 & LDST_LEN_MASK); -+ -+ tmpdesc[idx++] = (u32)keymod; -+ -+ /* -+ * Encapsulation output must include space for blob key encryption -+ * key and MAC tag -+ */ -+ tmpdesc[idx++] = CMD_SEQ_OUT_PTR | (secretsz + BLOB_OVERHEAD); -+ tmpdesc[idx++] = (u32)outbuf; -+ -+ /* Input data, should be somewhere in secure memory */ -+ tmpdesc[idx++] = CMD_SEQ_IN_PTR | secretsz; -+ tmpdesc[idx++] = (u32)secretbuf; -+ -+ /* Set blob encap, then color */ -+ 
tmpdesc[idx] = CMD_OPERATION | OP_TYPE_ENCAP_PROTOCOL | OP_PCLID_BLOB; -+ -+ if (blobtype == SM_SECMEM) -+ tmpdesc[idx] |= OP_PCL_BLOB_PTXT_SECMEM; -+ -+ if (auth == KEY_COVER_CCM) -+ tmpdesc[idx] |= OP_PCL_BLOB_EKT; -+ -+ if (keycolor == BLACK_KEY) -+ tmpdesc[idx] |= OP_PCL_BLOB_BLACK; -+ -+ idx++; -+ tmpdesc[0] = CMD_DESC_HDR | HDR_ONE | (idx & HDR_DESCLEN_MASK); -+ dsize = idx * sizeof(u32); -+ -+ tdesc = kmalloc(dsize, GFP_KERNEL | GFP_DMA); -+ if (tdesc == NULL) -+ return 0; -+ -+ memcpy(tdesc, tmpdesc, dsize); -+ *desc = tdesc; -+ return dsize; -+} -+ -+/* -+ * Construct a blob decapsulation job descriptor -+ * -+ * This function dynamically constructs a blob decapsulation job descriptor -+ * from the following arguments: -+ * -+ * - desc pointer to a pointer to the descriptor generated by this -+ * function. Caller will be responsible to kfree() this -+ * descriptor after execution. -+ * - keymod Physical pointer to a key modifier, which must reside in a -+ * contiguous piece of memory. Modifier will be assumed to be -+ * 8 bytes long for a blob of type SM_SECMEM, or 16 bytes long -+ * for a blob of type SM_GENMEM (see blobtype argument). -+ * - blobbuf Physical pointer (into external memory) of the blob to -+ * be decapsulated. Blob must reside in a contiguous memory -+ * segment. -+ * - outbuf Physical pointer of the decapsulated output, possibly into -+ * a location within a secure memory page. Must be contiguous. -+ * - secretsz Size of encapsulated secret in bytes (not the size of the -+ * input blob). -+ * - keycolor Determines if decapsulated content is encrypted (BLACK_KEY) -+ * or left as plaintext (RED_KEY). -+ * - blobtype Determine if encapsulated blob should be a secure memory -+ * blob (SM_SECMEM), with partition data embedded with key -+ * material, or a general memory blob (SM_GENMEM). -+ * - auth If decapsulation path is specified by BLACK_KEY, then if -+ * AES-CCM is requested for key covering use KEY_COVER_CCM, else -+ * use AES-ECB (KEY_COVER_ECB). -+ * -+ * Upon completion, desc points to a buffer containing a CAAM job descriptor -+ * that decapsulates a key blob from external memory into a black (encrypted) -+ * key or red (plaintext) content. -+ * -+ * This is an example of a black key decapsulation job from a general memory -+ * blob. Notice the 16-byte key modifier in the LOAD instruction. -+ * -+ * [00] B0800008 jobhdr: stidx=0 len=8 -+ * [01] 14400010 ld: ccb2-key len=16 offs=0 -+ * [02] 08A63B7F ptr->@0x08a63b7f -+ * [03] F8000010 seqoutptr: len=16 -+ * [04] 01000000 out_ptr->@0x01000000 -+ * [05] F000003A seqinptr: len=58 -+ * [06] 01000010 in_ptr->@0x01000010 -+ * [07] 860D0004 operation: decap blob reg=memory, black, format=normal -+ * -+ * This is an example of a red key decapsulation job for restoring a red key -+ * from a secure memory blob. 
Note the 8 byte modifier on the 12 byte offset -+ * in the LOAD instruction: -+ * -+ * [00] B0800008 jobhdr: stidx=0 len=8 -+ * [01] 14400C08 ld: ccb2-key len=8 offs=12 -+ * [02] 01000000 ptr->@0x01000000 -+ * [03] F8000020 seqoutptr: len=32 -+ * [04] 400000E6 out_ptr->@0x400000e6 -+ * [05] F0000050 seqinptr: len=80 -+ * [06] 08F0C0EA in_ptr->@0x08f0c0ea -+ * [07] 860D0008 operation: decap blob reg=memory, red, sec_mem, -+ * format=normal -+ * -+ * Note: this function only generates 32-bit pointers at present, and should -+ * be refactored using a scheme that allows both 32 and 64 bit addressing -+ */ -+ -+static int blob_decap_jobdesc(u32 **desc, dma_addr_t keymod, dma_addr_t blobbuf, -+ u8 *outbuf, u16 secretsz, u8 keycolor, -+ u8 blobtype, u8 auth) -+{ -+ u32 *tdesc, tmpdesc[INITIAL_DESCSZ]; -+ u16 dsize, idx; -+ -+ memset(tmpdesc, 0, INITIAL_DESCSZ * sizeof(u32)); -+ idx = 1; -+ -+ /* Load key modifier */ -+ if (blobtype == SM_SECMEM) -+ tmpdesc[idx++] = CMD_LOAD | LDST_CLASS_2_CCB | -+ LDST_SRCDST_BYTE_KEY | -+ ((12 << LDST_OFFSET_SHIFT) & LDST_OFFSET_MASK) -+ | (8 & LDST_LEN_MASK); -+ else /* is general memory blob */ -+ tmpdesc[idx++] = CMD_LOAD | LDST_CLASS_2_CCB | -+ LDST_SRCDST_BYTE_KEY | (16 & LDST_LEN_MASK); -+ -+ tmpdesc[idx++] = (u32)keymod; -+ -+ /* Compensate BKEK + MAC tag over size of encapsulated secret */ -+ tmpdesc[idx++] = CMD_SEQ_IN_PTR | (secretsz + BLOB_OVERHEAD); -+ tmpdesc[idx++] = (u32)blobbuf; -+ tmpdesc[idx++] = CMD_SEQ_OUT_PTR | secretsz; -+ tmpdesc[idx++] = (u32)outbuf; -+ -+ /* Decapsulate from secure memory partition to black blob */ -+ tmpdesc[idx] = CMD_OPERATION | OP_TYPE_DECAP_PROTOCOL | OP_PCLID_BLOB; -+ -+ if (blobtype == SM_SECMEM) -+ tmpdesc[idx] |= OP_PCL_BLOB_PTXT_SECMEM; -+ -+ if (auth == KEY_COVER_CCM) -+ tmpdesc[idx] |= OP_PCL_BLOB_EKT; -+ -+ if (keycolor == BLACK_KEY) -+ tmpdesc[idx] |= OP_PCL_BLOB_BLACK; -+ -+ idx++; -+ tmpdesc[0] = CMD_DESC_HDR | HDR_ONE | (idx & HDR_DESCLEN_MASK); -+ dsize = idx * sizeof(u32); -+ -+ tdesc = kmalloc(dsize, GFP_KERNEL | GFP_DMA); -+ if (tdesc == NULL) -+ return 0; -+ -+ memcpy(tdesc, tmpdesc, dsize); -+ *desc = tdesc; -+ return dsize; -+} -+ -+ -+ -+static int gen_mem_encap(struct device *jr_dev, void __user *secretbuf, -+ int keylen, void __user *kmodbuf, void __user *outbuf) -+{ -+ int retval = 0; -+ u32 dsize; -+ u32 __iomem *encapdesc = NULL; -+ dma_addr_t secret_dma = 0, keymod_dma = 0, outbuf_dma = 0; -+ u8 __iomem *lsecret = NULL, *lkeymod = NULL, *loutbuf = NULL; -+ struct sm_key_job_result testres; -+ -+ /* Build/map/flush the scret */ -+ lsecret = kmalloc(keylen, GFP_KERNEL | GFP_DMA); -+ if (!lsecret) { -+ dev_err(jr_dev, "%s: can't alloc for key\n", __func__); -+ retval = -ENOMEM; -+ goto out; -+ } -+ if (copy_from_user(lsecret, secretbuf, keylen)) { -+ dev_err(jr_dev, "%s: can't Copy for key\n", __func__); -+ retval = -EFAULT; -+ goto out; -+ } -+ secret_dma = dma_map_single(jr_dev, lsecret, keylen, -+ DMA_TO_DEVICE); -+ -+ /* Build/map/flush the key modifier */ -+ lkeymod = kmalloc(GENMEM_KEYMOD_LEN, GFP_KERNEL | GFP_DMA); -+ if (!lkeymod) { -+ dev_err(jr_dev, "%s: can't alloc for keymod\n", __func__); -+ retval = -ENOMEM; -+ goto out; -+ } -+ if (copy_from_user(lkeymod, kmodbuf, GENMEM_KEYMOD_LEN)) { -+ dev_err(jr_dev, "%s: can't Copy for keymod\n", __func__); -+ retval = -EFAULT; -+ goto out; -+ } -+ keymod_dma = dma_map_single(jr_dev, lkeymod, GENMEM_KEYMOD_LEN, -+ DMA_TO_DEVICE); -+ -+ loutbuf = kmalloc(keylen + BLOB_OVERHEAD, GFP_KERNEL | GFP_DMA); -+ if (!lkeymod) { -+ dev_err(jr_dev, 
"%s: can't alloc for output\n", __func__); -+ retval = -ENOMEM; -+ goto out; -+ } -+ outbuf_dma = dma_map_single(jr_dev, loutbuf, keylen + BLOB_OVERHEAD, -+ DMA_FROM_DEVICE); -+ dsize = blob_encap_jobdesc(&encapdesc, keymod_dma, (void *)secret_dma, outbuf_dma, -+ keylen, RED_KEY, SM_GENMEM, KEY_COVER_ECB); -+ if (!dsize) { -+ dev_err(jr_dev, "can't alloc an encapsulation descriptor\n"); -+ retval = -ENOMEM; -+ goto out; -+ } -+ init_completion(&testres.completion); -+ -+ retval = caam_jr_enqueue(jr_dev, encapdesc, sm_key_job_done, -+ &testres); -+ if (!retval) { -+ wait_for_completion_interruptible(&testres.completion); -+ dev_info(jr_dev, "job ring return %d\n", testres.error); -+ if (!testres.error) { -+ dma_sync_single_for_cpu(jr_dev, outbuf_dma, keylen + BLOB_OVERHEAD, -+ DMA_FROM_DEVICE); -+ -+ if (copy_to_user(outbuf, loutbuf, keylen + BLOB_OVERHEAD)) { -+ retval = -EFAULT; -+ dev_err(jr_dev, "can't copy for output\n"); -+ goto out; -+ } -+ } -+ retval = testres.error; -+ } -+ -+out: -+ if (outbuf_dma) -+ dma_unmap_single(jr_dev, outbuf_dma, keylen + BLOB_OVERHEAD, -+ DMA_FROM_DEVICE); -+ if (keymod_dma) -+ dma_unmap_single(jr_dev, keymod_dma, GENMEM_KEYMOD_LEN, DMA_TO_DEVICE); -+ if (secret_dma) -+ dma_unmap_single(jr_dev, secret_dma, keylen, DMA_TO_DEVICE); -+ kfree(encapdesc); -+ kfree(lkeymod); -+ kfree(lsecret); -+ kfree(loutbuf); -+ -+ return retval; -+} -+ -+static int gen_mem_decap(struct device *jr_dev, void __user *keyblobbuf, -+ int bloblen, void __user *kmodbuf, void __user *outbuf) -+{ -+ int retval = 0; -+ int keylen = bloblen - BLOB_OVERHEAD; -+ u32 dsize; -+ dma_addr_t keyblob_dma = 0, keymod_dma = 0, outbuf_dma = 0; -+ u8 __iomem *lkeyblob = NULL, *lkeymod = NULL, *loutbuf = NULL; -+ struct sm_key_job_result testres; -+ u32 __iomem *decapdesc = NULL; -+ -+ /* Build/map/flush the scret */ -+ lkeyblob = kmalloc(bloblen, GFP_KERNEL | GFP_DMA); -+ if (!lkeyblob) { -+ dev_err(jr_dev, "%s: can't alloc for keylob\n", __func__); -+ retval = -ENOMEM; -+ goto out; -+ } -+ if (copy_from_user(lkeyblob, keyblobbuf, bloblen)) { -+ dev_err(jr_dev, "%s: can't Copy for keyblob\n", __func__); -+ retval = -EFAULT; -+ goto out; -+ } -+ keyblob_dma = dma_map_single(jr_dev, lkeyblob, bloblen, -+ DMA_TO_DEVICE); -+ -+ /* Build/map/flush the key modifier */ -+ lkeymod = kmalloc(GENMEM_KEYMOD_LEN, GFP_KERNEL | GFP_DMA); -+ if (!lkeymod) { -+ dev_err(jr_dev, "%s: can't alloc for keymod\n", __func__); -+ retval = -ENOMEM; -+ goto out; -+ } -+ if (copy_from_user(lkeymod, kmodbuf, GENMEM_KEYMOD_LEN)) { -+ dev_err(jr_dev, "%s: can't Copy for keymod\n", __func__); -+ retval = -EFAULT; -+ goto out; -+ } -+ keymod_dma = dma_map_single(jr_dev, lkeymod, GENMEM_KEYMOD_LEN, -+ DMA_TO_DEVICE); -+ -+ loutbuf = kmalloc(keylen, GFP_KERNEL | GFP_DMA); -+ if (!loutbuf) { -+ dev_err(jr_dev, "%s: can't alloc for outbuf\n", __func__); -+ retval = -ENOMEM; -+ goto out; -+ } -+ outbuf_dma = dma_map_single(jr_dev, loutbuf, keylen, -+ DMA_FROM_DEVICE); -+ -+ /* Build the encapsulation job descriptor */ -+ dsize = blob_decap_jobdesc(&decapdesc, keymod_dma, keyblob_dma, (u8 *)outbuf_dma, -+ keylen, RED_KEY, SM_GENMEM, KEY_COVER_ECB); -+ if (!dsize) { -+ dev_err(jr_dev, "can't alloc a decapsulation descriptor\n"); -+ retval = -ENOMEM; -+ goto out; -+ } -+ -+ init_completion(&testres.completion); -+ -+ retval = caam_jr_enqueue(jr_dev, decapdesc, sm_key_job_done, -+ &testres); -+ if (!retval) { -+ wait_for_completion_interruptible(&testres.completion); -+ dev_info(jr_dev, "job ring return %d\n", testres.error); -+ if 
(!testres.error) { -+ dma_sync_single_for_cpu(jr_dev, outbuf_dma, keylen, -+ DMA_FROM_DEVICE); -+ -+ if (copy_to_user(outbuf, loutbuf, keylen)) { -+ retval = -EFAULT; -+ goto out; -+ } -+ } -+ retval = testres.error; -+ } -+ -+out: -+ if (outbuf_dma) -+ dma_unmap_single(jr_dev, outbuf_dma, keylen, -+ DMA_FROM_DEVICE); -+ if (keymod_dma) -+ dma_unmap_single(jr_dev, keymod_dma, GENMEM_KEYMOD_LEN, -+ DMA_TO_DEVICE); -+ if (keyblob_dma) -+ dma_unmap_single(jr_dev, keyblob_dma, bloblen, -+ DMA_TO_DEVICE); -+ kfree(decapdesc); -+ kfree(lkeymod); -+ kfree(lkeyblob); -+ kfree(loutbuf); -+ -+ return retval; -+} -+ -+ -+static long kb_ioctl(struct file *file, unsigned int cmd, unsigned long arg) -+{ -+ int retval = 0; -+ struct caam_kb_data kb_data; -+ struct miscdevice *miscdev = file->private_data; -+ struct kb_device *dev = container_of(miscdev, struct kb_device, misc_dev); -+ -+ if (copy_from_user(&kb_data, (void *)arg, sizeof(kb_data))) { -+ retval = -EFAULT; -+ goto err; -+ } -+ -+ if (!kb_data.rawkey || !kb_data.keyblob || -+ (kb_data.rawkey_len + BLOB_OVERHEAD != kb_data.keyblob_len) || -+ (kb_data.keymod_len != GENMEM_KEYMOD_LEN)) { -+ retval = -EINVAL; -+ goto err; -+ } -+ -+ printk(KERN_INFO"%s:rawkey_len %d, keyblob_len %d\n", -+ __func__, kb_data.rawkey_len, kb_data.keyblob_len); -+ -+ switch (cmd) { -+ case CAAM_KB_ENCRYPT: -+ { -+ retval = gen_mem_encap(dev->jr_dev, kb_data.rawkey, kb_data.rawkey_len, -+ kb_data.keymod, kb_data.keyblob); -+ break; -+ } -+ case CAAM_KB_DECRYPT: -+ { -+ retval = gen_mem_decap(dev->jr_dev, kb_data.keyblob, kb_data.keyblob_len, -+ kb_data.keymod, kb_data.rawkey); -+ break; -+ } -+ default: -+ return -ENOTTY; -+ } -+ -+err: -+ return retval; -+} -+ -+static const struct file_operations kb_fops = { -+ .owner = THIS_MODULE, -+ .open = kb_open, -+ .release = kb_release, -+ .unlocked_ioctl = kb_ioctl, -+}; -+ -+static struct kb_device *kb_device_create(void) -+{ -+ struct kb_device *idev; -+ int ret; -+ -+ idev = kzalloc(sizeof(struct kb_device), GFP_KERNEL); -+ if (!idev) -+ return ERR_PTR(-ENOMEM); -+ -+ idev->misc_dev.minor = MISC_DYNAMIC_MINOR; -+ idev->misc_dev.name = "caam_kb"; -+ idev->misc_dev.fops = &kb_fops; -+ idev->misc_dev.parent = NULL; -+ ret = misc_register(&idev->misc_dev); -+ if (ret) { -+ pr_err("ion: failed to register misc device.\n"); -+ return ERR_PTR(ret); -+ } -+ -+ return idev; -+} -+ -+static int kb_device_destroy(struct kb_device *kb_dev) -+{ -+ if ((kb_dev) && (kb_dev->jr_dev)) { -+ caam_jr_free(kb_dev->jr_dev); -+ kb_dev->jr_dev = NULL; -+ } -+ -+ if (kb_dev) -+ misc_deregister(&kb_dev->misc_dev); -+ -+ return 0; -+} -+/* -+ * Probe key blob device -+ */ -+static int caam_keyblob_probe(struct platform_device *pdev) -+{ -+ int err; -+ -+ dev_dbg(&pdev->dev, "%s enter\n", __func__); -+ kb_dev = kb_device_create(); -+ if (IS_ERR_OR_NULL(kb_dev)) { -+ err = PTR_ERR(kb_dev); -+ goto err; -+ } -+ return 0; -+err: -+ return err; -+} -+ -+/* -+ * Remove key blob device -+ */ -+static int caam_keyblob_remove(struct platform_device *pdev) -+{ -+ kb_device_destroy(kb_dev); -+ return 0; -+} -+ -+static struct of_device_id caam_keyblob_match[] = { -+ { -+ .compatible = "fsl,sec-v4.0-keyblob", -+ }, -+ { -+ .compatible = "fsl,sec4.0-keyblob", -+ }, -+ {}, -+}; -+ -+MODULE_DEVICE_TABLE(of, caam_keyblob_match); -+ -+static struct platform_driver caam_keyblob_driver = { -+ .driver = { -+ .name = "caam_keyblob", -+ .owner = THIS_MODULE, -+ .of_match_table = caam_keyblob_match, -+ }, -+ .probe = caam_keyblob_probe, -+ .remove = caam_keyblob_remove, 
-+}; -+ -+static int __init keyblob_driver_init(void) -+{ -+ return platform_driver_register(&caam_keyblob_driver); -+} -+ -+static void __exit keyblob_driver_exit(void) -+{ -+ platform_driver_unregister(&caam_keyblob_driver); -+} -+ -+module_init(keyblob_driver_init); -+module_exit(keyblob_driver_exit); -+ -+ -+MODULE_LICENSE("Dual BSD/GPL"); -+MODULE_DESCRIPTION("FSL CAAM Secure Memory / Keystore"); -+MODULE_AUTHOR("Freescale Semiconductor - NMSG/MAD"); -diff -Nur linux-4.1.3/drivers/crypto/caam/caam_keyblob.h linux-xbian-imx6/drivers/crypto/caam/caam_keyblob.h ---- linux-4.1.3/drivers/crypto/caam/caam_keyblob.h 1970-01-01 01:00:00.000000000 +0100 -+++ linux-xbian-imx6/drivers/crypto/caam/caam_keyblob.h 2015-07-27 23:13:04.205975852 +0200 -@@ -0,0 +1,45 @@ -+/* -+ * CAAM public-level include definitions for the key blob -+ * -+ * Copyright (C) 2015 Freescale Semiconductor, Inc. -+ */ -+ -+#ifndef CAAM_KEYBLOB_H -+#define CAAM_KEYBLOB_H -+ -+ -+#include -+#include -+ -+struct caam_kb_data { -+ char *rawkey; -+ size_t rawkey_len; -+ char *keyblob; -+ size_t keyblob_len; -+ char *keymod; -+ size_t keymod_len; -+}; -+ -+ -+#define CAAM_KB_MAGIC 'I' -+ -+/** -+ * DOC: CAAM_KB_ENCRYPT - generate a key blob from raw key -+ * -+ * Takes an caam_kb_data struct and returns it with the key blob -+ */ -+#define CAAM_KB_ENCRYPT _IOWR(CAAM_KB_MAGIC, 0, \ -+ struct caam_kb_data) -+ -+/** -+ * DOC: CAAM_KB_DECRYPT - get keys from a key blob -+ * -+ * Takes an caam_kb_data struct and returns it with the raw key. -+ */ -+#define CAAM_KB_DECRYPT _IOWR(CAAM_KB_MAGIC, 1, struct caam_kb_data) -+ -+#ifndef GENMEM_KEYMOD_LEN -+#define GENMEM_KEYMOD_LEN 16 -+#endif -+ -+#endif /* CAAM_KEYBLOB_H */ -diff -Nur linux-4.1.3/drivers/crypto/caam/caamrng.c linux-xbian-imx6/drivers/crypto/caam/caamrng.c ---- linux-4.1.3/drivers/crypto/caam/caamrng.c 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/drivers/crypto/caam/caamrng.c 2015-07-27 23:13:04.209961631 +0200 -@@ -1,7 +1,7 @@ - /* - * caam - Freescale FSL CAAM support for hw_random - * -- * Copyright 2011 Freescale Semiconductor, Inc. -+ * Copyright (C) 2011-2013 Freescale Semiconductor, Inc. - * - * Based on caamalg.c crypto API driver. 
- * -@@ -80,9 +80,12 @@ - - static inline void rng_unmap_buf(struct device *jrdev, struct buf_data *bd) - { -- if (bd->addr) -+ if (bd->addr) { -+ dma_sync_single_for_cpu(jrdev, bd->addr, RN_BUF_SIZE, -+ DMA_FROM_DEVICE); - dma_unmap_single(jrdev, bd->addr, RN_BUF_SIZE, - DMA_FROM_DEVICE); -+ } - } - - static inline void rng_unmap_ctx(struct caam_rng_ctx *ctx) -@@ -103,11 +106,18 @@ - bd = (struct buf_data *)((char *)desc - - offsetof(struct buf_data, hw_desc)); - -- if (err) -- caam_jr_strstatus(jrdev, err); -+ if (err) { -+ char tmp[CAAM_ERROR_STR_MAX]; -+ -+ dev_err(jrdev, "%08x: %s\n", err, caam_jr_strstatus(tmp, err)); -+ } - - atomic_set(&bd->empty, BUF_NOT_EMPTY); - complete(&bd->filled); -+ -+ /* Buffer refilled, invalidate cache */ -+ dma_sync_single_for_cpu(jrdev, bd->addr, RN_BUF_SIZE, DMA_FROM_DEVICE); -+ - #ifdef DEBUG - print_hex_dump(KERN_ERR, "rng refreshed buf@: ", - DUMP_PREFIX_ADDRESS, 16, 4, bd->buf, RN_BUF_SIZE, 1); -@@ -185,7 +195,7 @@ - max - copied_idx, false); - } - --static inline int rng_create_sh_desc(struct caam_rng_ctx *ctx) -+static inline void rng_create_sh_desc(struct caam_rng_ctx *ctx) - { - struct device *jrdev = ctx->jrdev; - u32 *desc = ctx->sh_desc; -@@ -203,18 +213,16 @@ - - ctx->sh_desc_dma = dma_map_single(jrdev, desc, desc_bytes(desc), - DMA_TO_DEVICE); -- if (dma_mapping_error(jrdev, ctx->sh_desc_dma)) { -- dev_err(jrdev, "unable to map shared descriptor\n"); -- return -ENOMEM; -- } -+ dma_sync_single_for_device(jrdev, ctx->sh_desc_dma, desc_bytes(desc), -+ DMA_TO_DEVICE); -+ - #ifdef DEBUG - print_hex_dump(KERN_ERR, "rng shdesc@: ", DUMP_PREFIX_ADDRESS, 16, 4, - desc, desc_bytes(desc), 1); - #endif -- return 0; - } - --static inline int rng_create_job_desc(struct caam_rng_ctx *ctx, int buf_id) -+static inline void rng_create_job_desc(struct caam_rng_ctx *ctx, int buf_id) - { - struct device *jrdev = ctx->jrdev; - struct buf_data *bd = &ctx->bufs[buf_id]; -@@ -225,17 +233,12 @@ - HDR_REVERSE); - - bd->addr = dma_map_single(jrdev, bd->buf, RN_BUF_SIZE, DMA_FROM_DEVICE); -- if (dma_mapping_error(jrdev, bd->addr)) { -- dev_err(jrdev, "unable to map dst\n"); -- return -ENOMEM; -- } - - append_seq_out_ptr_intlen(desc, bd->addr, RN_BUF_SIZE, 0); - #ifdef DEBUG - print_hex_dump(KERN_ERR, "rng job desc@: ", DUMP_PREFIX_ADDRESS, 16, 4, - desc, desc_bytes(desc), 1); - #endif -- return 0; - } - - static void caam_cleanup(struct hwrng *rng) -@@ -252,44 +255,67 @@ - rng_unmap_ctx(rng_ctx); - } - --static int caam_init_buf(struct caam_rng_ctx *ctx, int buf_id) -+#ifdef CONFIG_CRYPTO_DEV_FSL_CAAM_RNG_TEST -+static inline void test_len(struct hwrng *rng, size_t len, bool wait) - { -- struct buf_data *bd = &ctx->bufs[buf_id]; -- int err; -+ u8 *buf; -+ int real_len; - -- err = rng_create_job_desc(ctx, buf_id); -- if (err) -- return err; -+ buf = kzalloc(sizeof(u8) * len, GFP_KERNEL); -+ real_len = rng->read(rng, buf, len, wait); -+ if (real_len == 0 && wait) -+ pr_err("WAITING FAILED\n"); -+ pr_info("wanted %d bytes, got %d\n", len, real_len); -+ print_hex_dump(KERN_INFO, "random bytes@: ", DUMP_PREFIX_ADDRESS, -+ 16, 4, buf, real_len, 1); -+ kfree(buf); -+} - -- atomic_set(&bd->empty, BUF_EMPTY); -- submit_job(ctx, buf_id == ctx->current_buf); -- wait_for_completion(&bd->filled); -+static inline void test_mode_once(struct hwrng *rng, bool wait) -+{ -+#define TEST_CHUNK (RN_BUF_SIZE / 4) - -- return 0; -+ test_len(rng, TEST_CHUNK, wait); -+ test_len(rng, RN_BUF_SIZE * 2, wait); -+ test_len(rng, RN_BUF_SIZE * 2 - TEST_CHUNK, wait); - } - --static int 
caam_init_rng(struct caam_rng_ctx *ctx, struct device *jrdev) -+static inline void test_mode(struct hwrng *rng, bool wait) - { -- int err; -- -- ctx->jrdev = jrdev; -+#define TEST_PASS 1 -+ int i; - -- err = rng_create_sh_desc(ctx); -- if (err) -- return err; -+ for (i = 0; i < TEST_PASS; i++) -+ test_mode_once(rng, wait); -+} - -- ctx->current_buf = 0; -- ctx->cur_buf_idx = 0; -+static void self_test(struct hwrng *rng) -+{ -+ pr_info("testing without waiting\n"); -+ test_mode(rng, false); -+ pr_info("testing with waiting\n"); -+ test_mode(rng, true); -+} -+#endif - -- err = caam_init_buf(ctx, 0); -- if (err) -- return err; -+static void caam_init_buf(struct caam_rng_ctx *ctx, int buf_id) -+{ -+ struct buf_data *bd = &ctx->bufs[buf_id]; - -- err = caam_init_buf(ctx, 1); -- if (err) -- return err; -+ rng_create_job_desc(ctx, buf_id); -+ atomic_set(&bd->empty, BUF_EMPTY); -+ submit_job(ctx, buf_id == ctx->current_buf); -+ wait_for_completion(&bd->filled); -+} - -- return 0; -+static void caam_init_rng(struct caam_rng_ctx *ctx, struct device *jrdev) -+{ -+ ctx->jrdev = jrdev; -+ rng_create_sh_desc(ctx); -+ ctx->current_buf = 0; -+ ctx->cur_buf_idx = 0; -+ caam_init_buf(ctx, 0); -+ caam_init_buf(ctx, 1); - } - - static struct hwrng caam_rng = { -@@ -300,19 +326,15 @@ - - static void __exit caam_rng_exit(void) - { -- caam_jr_free(rng_ctx->jrdev); - hwrng_unregister(&caam_rng); -- kfree(rng_ctx); - } - - static int __init caam_rng_init(void) - { -- struct device *dev; - struct device_node *dev_node; - struct platform_device *pdev; - struct device *ctrldev; -- void *priv; -- int err; -+ struct caam_drv_private *priv; - - dev_node = of_find_compatible_node(NULL, NULL, "fsl,sec-v4.0"); - if (!dev_node) { -@@ -322,35 +344,26 @@ - } - - pdev = of_find_device_by_node(dev_node); -- if (!pdev) { -- of_node_put(dev_node); -+ if (!pdev) - return -ENODEV; -- } - - ctrldev = &pdev->dev; - priv = dev_get_drvdata(ctrldev); - of_node_put(dev_node); - -- /* -- * If priv is NULL, it's probably because the caam driver wasn't -- * properly initialized (e.g. RNG4 init failed). Thus, bail out here. 
-- */ -- if (!priv) -+ /* Check RNG present in hardware before registration */ -+ if (!(rd_reg64(&priv->ctrl->perfmon.cha_num) & CHA_ID_RNG_MASK)) - return -ENODEV; - -- dev = caam_jr_alloc(); -- if (IS_ERR(dev)) { -- pr_err("Job Ring Device allocation for transform failed\n"); -- return PTR_ERR(dev); -- } -- rng_ctx = kmalloc(sizeof(struct caam_rng_ctx), GFP_DMA); -- if (!rng_ctx) -- return -ENOMEM; -- err = caam_init_rng(rng_ctx, dev); -- if (err) -- return err; -+ rng_ctx = kmalloc(sizeof(struct caam_rng_ctx), GFP_KERNEL | GFP_DMA); -+ -+ caam_init_rng(rng_ctx, priv->jrdev[0]); -+ -+#ifdef CONFIG_CRYPTO_DEV_FSL_CAAM_RNG_TEST -+ self_test(&caam_rng); -+#endif - -- dev_info(dev, "registering rng-caam\n"); -+ dev_info(priv->jrdev[0], "registering rng-caam\n"); - return hwrng_register(&caam_rng); - } - -diff -Nur linux-4.1.3/drivers/crypto/caam/compat.h linux-xbian-imx6/drivers/crypto/caam/compat.h ---- linux-4.1.3/drivers/crypto/caam/compat.h 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/drivers/crypto/caam/compat.h 2015-07-27 23:13:04.209961631 +0200 -@@ -14,6 +14,8 @@ - #include - #include - #include -+#include -+#include - #include - #include - #include -@@ -23,12 +25,15 @@ - #include - #include - #include -+#include -+ -+#ifdef CONFIG_ARM /* needs the clock control subsystem */ -+#include -+#endif - #include - - #include --#include - #include --#include - #include - #include - #include -diff -Nur linux-4.1.3/drivers/crypto/caam/ctrl.c linux-xbian-imx6/drivers/crypto/caam/ctrl.c ---- linux-4.1.3/drivers/crypto/caam/ctrl.c 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/drivers/crypto/caam/ctrl.c 2015-07-27 23:13:04.209961631 +0200 -@@ -1,405 +1,260 @@ --/* * CAAM control-plane driver backend -+/* -+ * CAAM control-plane driver backend - * Controller-level driver, kernel property detection, initialization - * -- * Copyright 2008-2012 Freescale Semiconductor, Inc. -+ * Copyright (C) 2008-2013 Freescale Semiconductor, Inc. - */ - --#include --#include --#include -- - #include "compat.h" - #include "regs.h" - #include "intern.h" - #include "jr.h" - #include "desc_constr.h" - #include "error.h" -+#include "ctrl.h" -+#include "sm.h" -+#include - --/* -- * Descriptor to instantiate RNG State Handle 0 in normal mode and -- * load the JDKEK, TDKEK and TDSK registers -- */ --static void build_instantiation_desc(u32 *desc, int handle, int do_sk) --{ -- u32 *jump_cmd, op_flags; -- -- init_job_desc(desc, 0); -- -- op_flags = OP_TYPE_CLASS1_ALG | OP_ALG_ALGSEL_RNG | -- (handle << OP_ALG_AAI_SHIFT) | OP_ALG_AS_INIT; -- -- /* INIT RNG in non-test mode */ -- append_operation(desc, op_flags); -- -- if (!handle && do_sk) { -- /* -- * For SH0, Secure Keys must be generated as well -- */ -+/* Used to capture the array of job rings */ -+struct device **caam_jr_dev; - -- /* wait for done */ -- jump_cmd = append_jump(desc, JUMP_CLASS_CLASS1); -- set_jump_tgt_here(desc, jump_cmd); -+static int caam_remove(struct platform_device *pdev) -+{ -+ struct device *ctrldev; -+ struct caam_drv_private *ctrlpriv; -+ struct caam_drv_private_jr *jrpriv; -+ struct caam_full __iomem *topregs; -+ int ring, ret = 0; - -- /* -- * load 1 to clear written reg: -- * resets the done interrrupt and returns the RNG to idle. 
-- */ -- append_load_imm_u32(desc, 1, LDST_SRCDST_WORD_CLRW); -+ ctrldev = &pdev->dev; -+ ctrlpriv = dev_get_drvdata(ctrldev); -+ topregs = (struct caam_full __iomem *)ctrlpriv->ctrl; - -- /* Initialize State Handle */ -- append_operation(desc, OP_TYPE_CLASS1_ALG | OP_ALG_ALGSEL_RNG | -- OP_ALG_AAI_RNG4_SK); -+ /* shut down JobRs */ -+ for (ring = 0; ring < ctrlpriv->total_jobrs; ring++) { -+ ret |= caam_jr_shutdown(ctrlpriv->jrdev[ring]); -+ jrpriv = dev_get_drvdata(ctrlpriv->jrdev[ring]); -+ irq_dispose_mapping(jrpriv->irq); - } - -- append_jump(desc, JUMP_CLASS_CLASS1 | JUMP_TYPE_HALT); --} -+ /* Shut down debug views */ -+#ifdef CONFIG_DEBUG_FS -+ debugfs_remove_recursive(ctrlpriv->dfs_root); -+#endif - --/* Descriptor for deinstantiation of State Handle 0 of the RNG block. */ --static void build_deinstantiation_desc(u32 *desc, int handle) --{ -- init_job_desc(desc, 0); -+ /* Unmap controller region */ -+ iounmap(&topregs->ctrl); - -- /* Uninstantiate State Handle 0 */ -- append_operation(desc, OP_TYPE_CLASS1_ALG | OP_ALG_ALGSEL_RNG | -- (handle << OP_ALG_AAI_SHIFT) | OP_ALG_AS_INITFINAL); -+#ifdef CONFIG_ARM -+ /* shut clocks off before finalizing shutdown */ -+ clk_disable(ctrlpriv->caam_ipg); -+ clk_disable(ctrlpriv->caam_mem); -+ clk_disable(ctrlpriv->caam_aclk); -+#endif -+ -+ kfree(ctrlpriv->jrdev); -+ kfree(ctrlpriv); - -- append_jump(desc, JUMP_CLASS_CLASS1 | JUMP_TYPE_HALT); -+ return ret; - } - - /* -- * run_descriptor_deco0 - runs a descriptor on DECO0, under direct control of -- * the software (no JR/QI used). -- * @ctrldev - pointer to device -- * @status - descriptor status, after being run -- * -- * Return: - 0 if no error occurred -- * - -ENODEV if the DECO couldn't be acquired -- * - -EAGAIN if an error occurred while executing the descriptor -+ * Descriptor to instantiate RNG State Handle 0 in normal mode and -+ * load the JDKEK, TDKEK and TDSK registers - */ --static inline int run_descriptor_deco0(struct device *ctrldev, u32 *desc, -- u32 *status) -+static void build_instantiation_desc(u32 *desc) - { -- struct caam_drv_private *ctrlpriv = dev_get_drvdata(ctrldev); -- struct caam_ctrl __iomem *ctrl = ctrlpriv->ctrl; -- struct caam_deco __iomem *deco = ctrlpriv->deco; -- unsigned int timeout = 100000; -- u32 deco_dbg_reg, flags; -- int i; -- -+ u32 *jump_cmd; - -- if (ctrlpriv->virt_en == 1) { -- setbits32(&ctrl->deco_rsr, DECORSR_JR0); -- -- while (!(rd_reg32(&ctrl->deco_rsr) & DECORSR_VALID) && -- --timeout) -- cpu_relax(); -- -- timeout = 100000; -- } -- -- setbits32(&ctrl->deco_rq, DECORR_RQD0ENABLE); -- -- while (!(rd_reg32(&ctrl->deco_rq) & DECORR_DEN0) && -- --timeout) -- cpu_relax(); -+ init_job_desc(desc, 0); - -- if (!timeout) { -- dev_err(ctrldev, "failed to acquire DECO 0\n"); -- clrbits32(&ctrl->deco_rq, DECORR_RQD0ENABLE); -- return -ENODEV; -- } -+ /* INIT RNG in non-test mode */ -+ append_operation(desc, OP_TYPE_CLASS1_ALG | OP_ALG_ALGSEL_RNG | -+ OP_ALG_AS_INIT); - -- for (i = 0; i < desc_len(desc); i++) -- wr_reg32(&deco->descbuf[i], *(desc + i)); -+ /* wait for done */ -+ jump_cmd = append_jump(desc, JUMP_CLASS_CLASS1); -+ set_jump_tgt_here(desc, jump_cmd); - -- flags = DECO_JQCR_WHL; - /* -- * If the descriptor length is longer than 4 words, then the -- * FOUR bit in JRCTRL register must be set. -+ * load 1 to clear written reg: -+ * resets the done interrupt and returns the RNG to idle. 
- */ -- if (desc_len(desc) >= 4) -- flags |= DECO_JQCR_FOUR; -+ append_load_imm_u32(desc, 1, LDST_SRCDST_WORD_CLRW); - -- /* Instruct the DECO to execute it */ -- wr_reg32(&deco->jr_ctl_hi, flags); -- -- timeout = 10000000; -- do { -- deco_dbg_reg = rd_reg32(&deco->desc_dbg); -- /* -- * If an error occured in the descriptor, then -- * the DECO status field will be set to 0x0D -- */ -- if ((deco_dbg_reg & DESC_DBG_DECO_STAT_MASK) == -- DESC_DBG_DECO_STAT_HOST_ERR) -- break; -- cpu_relax(); -- } while ((deco_dbg_reg & DESC_DBG_DECO_STAT_VALID) && --timeout); -- -- *status = rd_reg32(&deco->op_status_hi) & -- DECO_OP_STATUS_HI_ERR_MASK; -- -- if (ctrlpriv->virt_en == 1) -- clrbits32(&ctrl->deco_rsr, DECORSR_JR0); -- -- /* Mark the DECO as free */ -- clrbits32(&ctrl->deco_rq, DECORR_RQD0ENABLE); -- -- if (!timeout) -- return -EAGAIN; -- -- return 0; - } - --/* -- * instantiate_rng - builds and executes a descriptor on DECO0, -- * which initializes the RNG block. -- * @ctrldev - pointer to device -- * @state_handle_mask - bitmask containing the instantiation status -- * for the RNG4 state handles which exist in -- * the RNG4 block: 1 if it's been instantiated -- * by an external entry, 0 otherwise. -- * @gen_sk - generate data to be loaded into the JDKEK, TDKEK and TDSK; -- * Caution: this can be done only once; if the keys need to be -- * regenerated, a POR is required -- * -- * Return: - 0 if no error occurred -- * - -ENOMEM if there isn't enough memory to allocate the descriptor -- * - -ENODEV if DECO0 couldn't be acquired -- * - -EAGAIN if an error occurred when executing the descriptor -- * f.i. there was a RNG hardware error due to not "good enough" -- * entropy being aquired. -- */ --static int instantiate_rng(struct device *ctrldev, int state_handle_mask, -- int gen_sk) -+static void generate_secure_keys_desc(u32 *desc) - { -- struct caam_drv_private *ctrlpriv = dev_get_drvdata(ctrldev); -- struct caam_ctrl __iomem *ctrl; -- u32 *desc, status, rdsta_val; -- int ret = 0, sh_idx; -- -- ctrl = (struct caam_ctrl __iomem *)ctrlpriv->ctrl; -- desc = kmalloc(CAAM_CMD_SZ * 7, GFP_KERNEL); -- if (!desc) -- return -ENOMEM; -+ /* generate secure keys (non-test) */ -+ append_operation(desc, OP_TYPE_CLASS1_ALG | OP_ALG_ALGSEL_RNG | -+ OP_ALG_RNG4_SK); -+} - -- for (sh_idx = 0; sh_idx < RNG4_MAX_HANDLES; sh_idx++) { -- /* -- * If the corresponding bit is set, this state handle -- * was initialized by somebody else, so it's left alone. -- */ -- if ((1 << sh_idx) & state_handle_mask) -- continue; -+struct instantiate_result { -+ struct completion completion; -+ int err; -+}; - -- /* Create the descriptor for instantiating RNG State Handle */ -- build_instantiation_desc(desc, sh_idx, gen_sk); -+static void rng4_init_done(struct device *dev, u32 *desc, u32 err, -+ void *context) -+{ -+ struct instantiate_result *instantiation = context; - -- /* Try to run it through DECO0 */ -- ret = run_descriptor_deco0(ctrldev, desc, &status); -+ if (err) { -+ char tmp[CAAM_ERROR_STR_MAX]; - -- /* -- * If ret is not 0, or descriptor status is not 0, then -- * something went wrong. No need to try the next state -- * handle (if available), bail out here. -- * Also, if for some reason, the State Handle didn't get -- * instantiated although the descriptor has finished -- * without any error (HW optimizations for later -- * CAAM eras), then try again. 
-- */ -- rdsta_val = rd_reg32(&ctrl->r4tst[0].rdsta) & RDSTA_IFMASK; -- if (status || !(rdsta_val & (1 << sh_idx))) -- ret = -EAGAIN; -- if (ret) -- break; -- dev_info(ctrldev, "Instantiated RNG4 SH%d\n", sh_idx); -- /* Clear the contents before recreating the descriptor */ -- memset(desc, 0x00, CAAM_CMD_SZ * 7); -+ dev_err(dev, "%08x: %s\n", err, caam_jr_strstatus(tmp, err)); - } - -- kfree(desc); -- -- return ret; -+ instantiation->err = err; -+ complete(&instantiation->completion); - } - --/* -- * deinstantiate_rng - builds and executes a descriptor on DECO0, -- * which deinitializes the RNG block. -- * @ctrldev - pointer to device -- * @state_handle_mask - bitmask containing the instantiation status -- * for the RNG4 state handles which exist in -- * the RNG4 block: 1 if it's been instantiated -- * -- * Return: - 0 if no error occurred -- * - -ENOMEM if there isn't enough memory to allocate the descriptor -- * - -ENODEV if DECO0 couldn't be acquired -- * - -EAGAIN if an error occurred when executing the descriptor -- */ --static int deinstantiate_rng(struct device *ctrldev, int state_handle_mask) -+static int instantiate_rng(struct device *jrdev, u32 keys_generated) - { -- u32 *desc, status; -- int sh_idx, ret = 0; -+ struct instantiate_result instantiation; - -- desc = kmalloc(CAAM_CMD_SZ * 3, GFP_KERNEL); -- if (!desc) -+ dma_addr_t desc_dma; -+ u32 *desc; -+ int ret; -+ -+ desc = kmalloc(CAAM_CMD_SZ * 6, GFP_KERNEL | GFP_DMA); -+ if (!desc) { -+ dev_err(jrdev, "cannot allocate RNG init descriptor memory\n"); - return -ENOMEM; -- -- for (sh_idx = 0; sh_idx < RNG4_MAX_HANDLES; sh_idx++) { -- /* -- * If the corresponding bit is set, then it means the state -- * handle was initialized by us, and thus it needs to be -- * deintialized as well -- */ -- if ((1 << sh_idx) & state_handle_mask) { -- /* -- * Create the descriptor for deinstantating this state -- * handle -- */ -- build_deinstantiation_desc(desc, sh_idx); -- -- /* Try to run it through DECO0 */ -- ret = run_descriptor_deco0(ctrldev, desc, &status); -- -- if (ret || status) { -- dev_err(ctrldev, -- "Failed to deinstantiate RNG4 SH%d\n", -- sh_idx); -- break; -- } -- dev_info(ctrldev, "Deinstantiated RNG4 SH%d\n", sh_idx); -- } - } - -- kfree(desc); -- -- return ret; --} -+ build_instantiation_desc(desc); - --static int caam_remove(struct platform_device *pdev) --{ -- struct device *ctrldev; -- struct caam_drv_private *ctrlpriv; -- struct caam_ctrl __iomem *ctrl; -- int ring, ret = 0; -- -- ctrldev = &pdev->dev; -- ctrlpriv = dev_get_drvdata(ctrldev); -- ctrl = (struct caam_ctrl __iomem *)ctrlpriv->ctrl; -- -- /* Remove platform devices for JobRs */ -- for (ring = 0; ring < ctrlpriv->total_jobrs; ring++) { -- if (ctrlpriv->jrpdev[ring]) -- of_device_unregister(ctrlpriv->jrpdev[ring]); -+ /* If keys have not been generated, add op code to generate key. */ -+ if (!keys_generated) -+ generate_secure_keys_desc(desc); -+ -+ desc_dma = dma_map_single(jrdev, desc, desc_bytes(desc), DMA_TO_DEVICE); -+ dma_sync_single_for_device(jrdev, desc_dma, desc_bytes(desc), -+ DMA_TO_DEVICE); -+ init_completion(&instantiation.completion); -+ ret = caam_jr_enqueue(jrdev, desc, rng4_init_done, &instantiation); -+ if (!ret) { -+ wait_for_completion_interruptible(&instantiation.completion); -+ ret = instantiation.err; -+ if (ret) -+ dev_err(jrdev, "unable to instantiate RNG\n"); - } - -- /* De-initialize RNG state handles initialized by this driver. 
*/ -- if (ctrlpriv->rng4_sh_init) -- deinstantiate_rng(ctrldev, ctrlpriv->rng4_sh_init); -- -- /* Shut down debug views */ --#ifdef CONFIG_DEBUG_FS -- debugfs_remove_recursive(ctrlpriv->dfs_root); --#endif -+ dma_unmap_single(jrdev, desc_dma, desc_bytes(desc), DMA_TO_DEVICE); - -- /* Unmap controller region */ -- iounmap(&ctrl); -+ kfree(desc); - - return ret; - } - - /* -- * kick_trng - sets the various parameters for enabling the initialization -- * of the RNG4 block in CAAM -- * @pdev - pointer to the platform device -- * @ent_delay - Defines the length (in system clocks) of each entropy sample. -+ * By default, the TRNG runs for 200 clocks per sample; -+ * 1600 clocks per sample generates better entropy. - */ --static void kick_trng(struct platform_device *pdev, int ent_delay) -+static void kick_trng(struct platform_device *pdev) - { - struct device *ctrldev = &pdev->dev; - struct caam_drv_private *ctrlpriv = dev_get_drvdata(ctrldev); -- struct caam_ctrl __iomem *ctrl; -+ struct caam_full __iomem *topregs; - struct rng4tst __iomem *r4tst; - u32 val; - -- ctrl = (struct caam_ctrl __iomem *)ctrlpriv->ctrl; -- r4tst = &ctrl->r4tst[0]; -+ topregs = (struct caam_full __iomem *)ctrlpriv->ctrl; -+ r4tst = &topregs->ctrl.r4tst[0]; - -+ val = rd_reg32(&r4tst->rtmctl); - /* put RNG4 into program mode */ - setbits32(&r4tst->rtmctl, RTMCTL_PRGM); -- -- /* -- * Performance-wise, it does not make sense to -- * set the delay to a value that is lower -- * than the last one that worked (i.e. the state handles -- * were instantiated properly. Thus, instead of wasting -- * time trying to set the values controlling the sample -- * frequency, the function simply returns. -- */ -- val = (rd_reg32(&r4tst->rtsdctl) & RTSDCTL_ENT_DLY_MASK) -- >> RTSDCTL_ENT_DLY_SHIFT; -- if (ent_delay <= val) { -- /* put RNG4 into run mode */ -- clrbits32(&r4tst->rtmctl, RTMCTL_PRGM); -- return; -- } -- -+ /* Set clocks per sample to the default, and divider to zero */ - val = rd_reg32(&r4tst->rtsdctl); - val = (val & ~RTSDCTL_ENT_DLY_MASK) | -- (ent_delay << RTSDCTL_ENT_DLY_SHIFT); -+ (RNG4_ENT_CLOCKS_SAMPLE << RTSDCTL_ENT_DLY_SHIFT); - wr_reg32(&r4tst->rtsdctl, val); -- /* min. freq. count, equal to 1/4 of the entropy sample length */ -- wr_reg32(&r4tst->rtfrqmin, ent_delay >> 2); -- /* disable maximum frequency count */ -- wr_reg32(&r4tst->rtfrqmax, RTFRQMAX_DISABLE); -- /* read the control register */ -- val = rd_reg32(&r4tst->rtmctl); -- /* -- * select raw sampling in both entropy shifter -- * and statistical checker -- */ -- setbits32(&val, RTMCTL_SAMP_MODE_RAW_ES_SC); -+ /* min. freq. count */ -+ wr_reg32(&r4tst->rtfrqmin, RNG4_ENT_CLOCKS_SAMPLE / 4); -+ /* max. freq. count */ -+ wr_reg32(&r4tst->rtfrqmax, RNG4_ENT_CLOCKS_SAMPLE * 8); - /* put RNG4 into run mode */ -- clrbits32(&val, RTMCTL_PRGM); -- /* write back the control register */ -- wr_reg32(&r4tst->rtmctl, val); -+ clrbits32(&r4tst->rtmctl, RTMCTL_PRGM); - } - - /** - * caam_get_era() - Return the ERA of the SEC on SoC, based -- * on "sec-era" propery in the DTS. This property is updated by u-boot. -+ * on the SEC_VID register. -+ * Returns the ERA number (1..4) or -ENOTSUPP if the ERA is unknown. -+ * @caam_id - the value of the SEC_VID register - **/ --int caam_get_era(void) -+int caam_get_era(u64 caam_id) - { -- struct device_node *caam_node; -- for_each_compatible_node(caam_node, NULL, "fsl,sec-v4.0") { -- const uint32_t *prop = (uint32_t *)of_get_property(caam_node, -- "fsl,sec-era", -- NULL); -- return prop ? 
*prop : -ENOTSUPP; -- } -+ struct sec_vid *sec_vid = (struct sec_vid *)&caam_id; -+ static const struct { -+ u16 ip_id; -+ u8 maj_rev; -+ u8 era; -+ } caam_eras[] = { -+ {0x0A10, 1, 1}, -+ {0x0A10, 2, 2}, -+ {0x0A12, 1, 3}, -+ {0x0A14, 1, 3}, -+ {0x0A14, 2, 4}, -+ {0x0A16, 1, 4}, -+ {0x0A11, 1, 4}, -+ {0x0A10, 3, 4}, -+ {0x0A18, 1, 4}, -+ {0x0A11, 2, 5}, -+ {0x0A12, 2, 5}, -+ {0x0A13, 1, 5}, -+ {0x0A1C, 1, 5}, -+ {0x0A12, 4, 6}, -+ {0x0A13, 2, 6}, -+ {0x0A16, 2, 6}, -+ {0x0A18, 2, 6}, -+ {0x0A1A, 1, 6}, -+ {0x0A1C, 2, 6}, -+ {0x0A17, 1, 6} -+ }; -+ int i; -+ -+ for (i = 0; i < ARRAY_SIZE(caam_eras); i++) -+ if (caam_eras[i].ip_id == sec_vid->ip_id && -+ caam_eras[i].maj_rev == sec_vid->maj_rev) -+ return caam_eras[i].era; - - return -ENOTSUPP; - } - EXPORT_SYMBOL(caam_get_era); - -+/* -+ * Return a job ring device. This is available so outside -+ * entities can gain direct access to the job ring. For now, -+ * this function returns the first job ring (at index 0). -+ */ -+struct device *caam_get_jrdev(void) -+{ -+ return caam_jr_dev[0]; -+} -+EXPORT_SYMBOL(caam_get_jrdev); -+ -+ - /* Probe routine for CAAM top (controller) level */ - static int caam_probe(struct platform_device *pdev) - { -- int ret, ring, rspec, gen_sk, ent_delay = RTSDCTL_ENT_DLY_MIN; -+ int ret, ring, rspec; - u64 caam_id; - struct device *dev; - struct device_node *nprop, *np; - struct caam_ctrl __iomem *ctrl; -+ struct caam_full __iomem *topregs; -+ struct snvs_full __iomem *snvsregs; - struct caam_drv_private *ctrlpriv; - #ifdef CONFIG_DEBUG_FS - struct caam_perfmon *perfmon; - #endif -- u32 scfgr, comp_params; -- u32 cha_vid_ls; -- int pg_size; -- int BLOCK_OFFSET = 0; - -- ctrlpriv = devm_kzalloc(&pdev->dev, sizeof(struct caam_drv_private), -- GFP_KERNEL); -+ ctrlpriv = kzalloc(sizeof(struct caam_drv_private), GFP_KERNEL); - if (!ctrlpriv) - return -ENOMEM; - -@@ -415,71 +270,128 @@ - dev_err(dev, "caam: of_iomap() failed\n"); - return -ENOMEM; - } -- /* Finding the page size for using the CTPR_MS register */ -- comp_params = rd_reg32(&ctrl->perfmon.comp_parms_ms); -- pg_size = (comp_params & CTPR_MS_PG_SZ_MASK) >> CTPR_MS_PG_SZ_SHIFT; -- -- /* Allocating the BLOCK_OFFSET based on the supported page size on -- * the platform -- */ -- if (pg_size == 0) -- BLOCK_OFFSET = PG_SIZE_4K; -- else -- BLOCK_OFFSET = PG_SIZE_64K; -- - ctrlpriv->ctrl = (struct caam_ctrl __force *)ctrl; -- ctrlpriv->assure = (struct caam_assurance __force *) -- ((uint8_t *)ctrl + -- BLOCK_OFFSET * ASSURE_BLOCK_NUMBER -- ); -- ctrlpriv->deco = (struct caam_deco __force *) -- ((uint8_t *)ctrl + -- BLOCK_OFFSET * DECO_BLOCK_NUMBER -- ); -+ -+ /* topregs used to derive pointers to CAAM sub-blocks only */ -+ topregs = (struct caam_full __iomem *)ctrl; - - /* Get the IRQ of the controller (for security violations only) */ -- ctrlpriv->secvio_irq = irq_of_parse_and_map(nprop, 0); -+ ctrlpriv->secvio_irq = of_irq_to_resource(nprop, 0, NULL); -+ -+ /* Get SNVS register Page */ -+ np = of_find_compatible_node(NULL, NULL, "fsl,imx6q-caam-snvs"); -+ -+ if (!np) -+ return -ENODEV; -+ -+ snvsregs = of_iomap(np, 0); -+ ctrlpriv->snvs = snvsregs; -+ /* Get CAAM-SM node and of_iomap() and save */ -+ np = of_find_compatible_node(NULL, NULL, "fsl,imx6q-caam-sm"); -+ -+ if (!np) -+ return -ENODEV; -+ -+ ctrlpriv->sm_base = of_iomap(np, 0); -+ ctrlpriv->sm_size = 0x3fff; -+ -+/* -+ * ARM targets tend to have clock control subsystems that can -+ * enable/disable clocking to our device. 
Turn clocking on to proceed -+ */ -+#ifdef CONFIG_ARM -+ ctrlpriv->caam_ipg = devm_clk_get(&ctrlpriv->pdev->dev, "caam_ipg"); -+ if (IS_ERR(ctrlpriv->caam_ipg)) { -+ ret = PTR_ERR(ctrlpriv->caam_ipg); -+ dev_err(&ctrlpriv->pdev->dev, -+ "can't identify CAAM ipg clk: %d\n", ret); -+ return -ENODEV; -+ } -+ ctrlpriv->caam_mem = devm_clk_get(&ctrlpriv->pdev->dev, "caam_mem"); -+ if (IS_ERR(ctrlpriv->caam_mem)) { -+ ret = PTR_ERR(ctrlpriv->caam_mem); -+ dev_err(&ctrlpriv->pdev->dev, -+ "can't identify CAAM secure mem clk: %d\n", ret); -+ return -ENODEV; -+ } -+ ctrlpriv->caam_aclk = devm_clk_get(&ctrlpriv->pdev->dev, "caam_aclk"); -+ if (IS_ERR(ctrlpriv->caam_aclk)) { -+ ret = PTR_ERR(ctrlpriv->caam_aclk); -+ dev_err(&ctrlpriv->pdev->dev, -+ "can't identify CAAM aclk clk: %d\n", ret); -+ return -ENODEV; -+ } -+ -+ ret = clk_prepare(ctrlpriv->caam_ipg); -+ if (ret < 0) { -+ dev_err(&pdev->dev, "can't prepare CAAM ipg clock: %d\n", ret); -+ return -ENODEV; -+ } -+ ret = clk_prepare(ctrlpriv->caam_mem); -+ if (ret < 0) { -+ dev_err(&pdev->dev, "can't prepare CAAM secure mem clock: %d\n", ret); -+ return -ENODEV; -+ } -+ ret = clk_prepare(ctrlpriv->caam_aclk); -+ if (ret < 0) { -+ dev_err(&pdev->dev, "can't prepare CAAM aclk clock: %d\n", ret); -+ return -ENODEV; -+ } -+ -+ ret = clk_enable(ctrlpriv->caam_ipg); -+ if (ret < 0) { -+ dev_err(&pdev->dev, "can't enable CAAM ipg clock: %d\n", ret); -+ return -ENODEV; -+ } -+ ret = clk_enable(ctrlpriv->caam_mem); -+ if (ret < 0) { -+ dev_err(&pdev->dev, "can't enable CAAM secure mem clock: %d\n", ret); -+ return -ENODEV; -+ } -+ ret = clk_enable(ctrlpriv->caam_aclk); -+ if (ret < 0) { -+ dev_err(&pdev->dev, "can't enable CAAM aclk clock: %d\n", ret); -+ return -ENODEV; -+ } -+ -+ pr_debug("%s caam_ipg clock:%d\n", __func__, -+ (int)clk_get_rate(ctrlpriv->caam_ipg)); -+ pr_debug("%s caam_mem clock:%d\n", __func__, -+ (int)clk_get_rate(ctrlpriv->caam_mem)); -+ pr_debug("%s caam_aclk clock:%d\n", __func__, -+ (int)clk_get_rate(ctrlpriv->caam_aclk)); -+#endif - - /* - * Enable DECO watchdogs and, if this is a PHYS_ADDR_T_64BIT kernel, - * long pointers in master configuration register - */ -- setbits32(&ctrl->mcr, MCFGR_WDENABLE | -+ setbits32(&topregs->ctrl.mcr, MCFGR_WDENABLE | - (sizeof(dma_addr_t) == sizeof(u64) ? MCFGR_LONG_PTR : 0)); - -+#ifdef CONFIG_ARCH_MX6 - /* -- * Read the Compile Time paramters and SCFGR to determine -- * if Virtualization is enabled for this platform -+ * ERRATA: mx6 devices have an issue wherein AXI bus transactions -+ * may not occur in the correct order. This isn't a problem running -+ * single descriptors, but can be if running multiple concurrent -+ * descriptors. Reworking the driver to throttle to single requests -+ * is impractical, thus the workaround is to limit the AXI pipeline -+ * to a depth of 1 (from it's default of 4) to preclude this situation -+ * from occurring. 
- */ -- scfgr = rd_reg32(&ctrl->scfgr); -- -- ctrlpriv->virt_en = 0; -- if (comp_params & CTPR_MS_VIRT_EN_INCL) { -- /* VIRT_EN_INCL = 1 & VIRT_EN_POR = 1 or -- * VIRT_EN_INCL = 1 & VIRT_EN_POR = 0 & SCFGR_VIRT_EN = 1 -- */ -- if ((comp_params & CTPR_MS_VIRT_EN_POR) || -- (!(comp_params & CTPR_MS_VIRT_EN_POR) && -- (scfgr & SCFGR_VIRT_EN))) -- ctrlpriv->virt_en = 1; -- } else { -- /* VIRT_EN_INCL = 0 && VIRT_EN_POR_VALUE = 1 */ -- if (comp_params & CTPR_MS_VIRT_EN_POR) -- ctrlpriv->virt_en = 1; -- } -- -- if (ctrlpriv->virt_en == 1) -- setbits32(&ctrl->jrstart, JRSTART_JR0_START | -- JRSTART_JR1_START | JRSTART_JR2_START | -- JRSTART_JR3_START); -+ wr_reg32(&topregs->ctrl.mcr, -+ (rd_reg32(&topregs->ctrl.mcr) & ~(MCFGR_AXIPIPE_MASK)) | -+ ((1 << MCFGR_AXIPIPE_SHIFT) & MCFGR_AXIPIPE_MASK)); -+#endif - -+ /* Set DMA masks according to platform ranging */ - if (sizeof(dma_addr_t) == sizeof(u64)) -- if (of_device_is_compatible(nprop, "fsl,sec-v5.0")) -- dma_set_mask_and_coherent(dev, DMA_BIT_MASK(40)); -+ if (of_device_is_compatible(nprop, "fsl,sec-v4.0")) -+ dma_set_mask(dev, DMA_BIT_MASK(40)); - else -- dma_set_mask_and_coherent(dev, DMA_BIT_MASK(36)); -+ dma_set_mask(dev, DMA_BIT_MASK(36)); - else -- dma_set_mask_and_coherent(dev, DMA_BIT_MASK(32)); -+ dma_set_mask(dev, DMA_BIT_MASK(32)); - - /* - * Detect and enable JobRs -@@ -487,51 +399,65 @@ - * for all, then go probe each one. - */ - rspec = 0; -- for_each_available_child_of_node(nprop, np) -- if (of_device_is_compatible(np, "fsl,sec-v4.0-job-ring") || -- of_device_is_compatible(np, "fsl,sec4.0-job-ring")) -+ for_each_compatible_node(np, NULL, "fsl,sec-v4.0-job-ring") -+ rspec++; -+ if (!rspec) { -+ /* for backward compatible with device trees */ -+ for_each_compatible_node(np, NULL, "fsl,sec4.0-job-ring") - rspec++; -+ } - -- ctrlpriv->jrpdev = devm_kzalloc(&pdev->dev, -- sizeof(struct platform_device *) * rspec, -- GFP_KERNEL); -- if (ctrlpriv->jrpdev == NULL) { -- iounmap(&ctrl); -+ ctrlpriv->jrdev = kzalloc(sizeof(struct device *) * rspec, GFP_KERNEL); -+ if (ctrlpriv->jrdev == NULL) { -+ iounmap(&topregs->ctrl); - return -ENOMEM; - } - - ring = 0; - ctrlpriv->total_jobrs = 0; -- for_each_available_child_of_node(nprop, np) -- if (of_device_is_compatible(np, "fsl,sec-v4.0-job-ring") || -- of_device_is_compatible(np, "fsl,sec4.0-job-ring")) { -- ctrlpriv->jrpdev[ring] = -- of_platform_device_create(np, NULL, dev); -- if (!ctrlpriv->jrpdev[ring]) { -- pr_warn("JR%d Platform device creation error\n", -- ring); -- continue; -+ for_each_compatible_node(np, NULL, "fsl,sec-v4.0-job-ring") { -+ ret = caam_jr_probe(pdev, np, ring); -+ if (ret < 0) { -+ /* -+ * Job ring not found, error out. At some -+ * point, we should enhance job ring handling -+ * to allow for non-consecutive job rings to -+ * be found. -+ */ -+ pr_err("fsl,sec-v4.0-job-ring not found "); -+ pr_err("(ring %d)\n", ring); -+ return ret; -+ } -+ ctrlpriv->total_jobrs++; -+ ring++; -+ } -+ -+ if (!ring) { -+ for_each_compatible_node(np, NULL, "fsl,sec4.0-job-ring") { -+ ret = caam_jr_probe(pdev, np, ring); -+ if (ret < 0) { -+ /* -+ * Job ring not found, error out. At some -+ * point, we should enhance job ring handling -+ * to allow for non-consecutive job rings to -+ * be found. 
-+ */ -+ pr_err("fsl,sec4.0-job-ring not found "); -+ pr_err("(ring %d)\n", ring); -+ return ret; - } -- ctrlpriv->jr[ring] = (struct caam_job_ring __force *) -- ((uint8_t *)ctrl + -- (ring + JR_BLOCK_NUMBER) * -- BLOCK_OFFSET -- ); - ctrlpriv->total_jobrs++; - ring++; -+ } - } - - /* Check to see if QI present. If so, enable */ -- ctrlpriv->qi_present = -- !!(rd_reg32(&ctrl->perfmon.comp_parms_ms) & -- CTPR_MS_QI_MASK); -+ ctrlpriv->qi_present = !!(rd_reg64(&topregs->ctrl.perfmon.comp_parms) & -+ CTPR_QI_MASK); - if (ctrlpriv->qi_present) { -- ctrlpriv->qi = (struct caam_queue_if __force *) -- ((uint8_t *)ctrl + -- BLOCK_OFFSET * QI_BLOCK_NUMBER -- ); -+ ctrlpriv->qi = (struct caam_queue_if __force *)&topregs->qi; - /* This is all that's required to physically enable QI */ -- wr_reg32(&ctrlpriv->qi->qi_control_lo, QICTL_DQEN); -+ wr_reg32(&topregs->qi.qi_control_lo, QICTL_DQEN); - } - - /* If no QI and no rings specified, quit and go home */ -@@ -541,81 +467,53 @@ - return -ENOMEM; - } - -- cha_vid_ls = rd_reg32(&ctrl->perfmon.cha_id_ls); -- - /* -- * If SEC has RNG version >= 4 and RNG state handle has not been -- * already instantiated, do RNG instantiation -+ * RNG4 based SECs (v5+ | >= i.MX6) need special initialization prior -+ * to executing any descriptors. If there's a problem with init, -+ * remove other subsystems and return; internal padding functions -+ * cannot run without an RNG. This procedure assumes a single RNG4 -+ * instance. - */ -- if ((cha_vid_ls & CHA_ID_LS_RNG_MASK) >> CHA_ID_LS_RNG_SHIFT >= 4) { -- ctrlpriv->rng4_sh_init = -- rd_reg32(&ctrl->r4tst[0].rdsta); -+ if ((rd_reg64(&topregs->ctrl.perfmon.cha_id) & CHA_ID_RNG_MASK) -+ == CHA_ID_RNG_4) { -+ struct rng4tst __iomem *r4tst; -+ u32 rdsta, rng_if, rng_skvn; -+ - /* -- * If the secure keys (TDKEK, JDKEK, TDSK), were already -- * generated, signal this to the function that is instantiating -- * the state handles. An error would occur if RNG4 attempts -- * to regenerate these keys before the next POR. -+ * Check to see if the RNG has already been instantiated. -+ * If either the state 0 or 1 instantiated flags are set, -+ * then don't continue on and try to instantiate the RNG -+ * again. - */ -- gen_sk = ctrlpriv->rng4_sh_init & RDSTA_SKVN ? 0 : 1; -- ctrlpriv->rng4_sh_init &= RDSTA_IFMASK; -- do { -- int inst_handles = -- rd_reg32(&ctrl->r4tst[0].rdsta) & -- RDSTA_IFMASK; -- /* -- * If either SH were instantiated by somebody else -- * (e.g. u-boot) then it is assumed that the entropy -- * parameters are properly set and thus the function -- * setting these (kick_trng(...)) is skipped. -- * Also, if a handle was instantiated, do not change -- * the TRNG parameters. -- */ -- if (!(ctrlpriv->rng4_sh_init || inst_handles)) { -- dev_info(dev, -- "Entropy delay = %u\n", -- ent_delay); -- kick_trng(pdev, ent_delay); -- ent_delay += 400; -+ r4tst = &topregs->ctrl.r4tst[0]; -+ rdsta = rd_reg32(&r4tst->rdsta); /* Read RDSTA register */ -+ -+ /* Check IF bit for non-deterministic instantiation */ -+ rng_if = rdsta & RDSTA_IF; -+ -+ /* Check SKVN bit for non-deterministic key generation */ -+ rng_skvn = rdsta & RDSTA_SKVN; -+ if (!rng_if) { -+ kick_trng(pdev); -+ ret = instantiate_rng(ctrlpriv->jrdev[0], rng_skvn); -+ if (ret) { -+ caam_remove(pdev); -+ return -ENODEV; - } -- /* -- * if instantiate_rng(...) fails, the loop will rerun -- * and the kick_trng(...) function will modfiy the -- * upper and lower limits of the entropy sampling -- * interval, leading to a sucessful initialization of -- * the RNG. 
-- */ -- ret = instantiate_rng(dev, inst_handles, -- gen_sk); -- if (ret == -EAGAIN) -- /* -- * if here, the loop will rerun, -- * so don't hog the CPU -- */ -- cpu_relax(); -- } while ((ret == -EAGAIN) && (ent_delay < RTSDCTL_ENT_DLY_MAX)); -- if (ret) { -- dev_err(dev, "failed to instantiate RNG"); -- caam_remove(pdev); -- return ret; -+ ctrlpriv->rng_inst++; - } -- /* -- * Set handles init'ed by this module as the complement of the -- * already initialized ones -- */ -- ctrlpriv->rng4_sh_init = ~ctrlpriv->rng4_sh_init & RDSTA_IFMASK; -- -- /* Enable RDB bit so that RNG works faster */ -- setbits32(&ctrl->scfgr, SCFGR_RDBENABLE); - } - - /* NOTE: RTIC detection ought to go here, around Si time */ - -- caam_id = (u64)rd_reg32(&ctrl->perfmon.caam_id_ms) << 32 | -- (u64)rd_reg32(&ctrl->perfmon.caam_id_ls); -+ /* Initialize queue allocator lock */ -+ spin_lock_init(&ctrlpriv->jr_alloc_lock); -+ -+ caam_id = rd_reg64(&topregs->ctrl.perfmon.caam_id); - - /* Report "alive" for developer to see */ - dev_info(dev, "device ID = 0x%016llx (Era %d)\n", caam_id, -- caam_get_era()); -+ caam_get_era(caam_id)); - dev_info(dev, "job rings = %d, qi = %d\n", - ctrlpriv->total_jobrs, ctrlpriv->qi_present); - -@@ -627,7 +525,7 @@ - */ - perfmon = (struct caam_perfmon __force *)&ctrl->perfmon; - -- ctrlpriv->dfs_root = debugfs_create_dir(dev_name(dev), NULL); -+ ctrlpriv->dfs_root = debugfs_create_dir("caam", NULL); - ctrlpriv->ctl = debugfs_create_dir("ctl", ctrlpriv->dfs_root); - - /* Controller-level - performance monitor counters */ -@@ -716,6 +614,7 @@ - static struct platform_driver caam_driver = { - .driver = { - .name = "caam", -+ .owner = THIS_MODULE, - .of_match_table = caam_match, - }, - .probe = caam_probe, -diff -Nur linux-4.1.3/drivers/crypto/caam/ctrl.h linux-xbian-imx6/drivers/crypto/caam/ctrl.h ---- linux-4.1.3/drivers/crypto/caam/ctrl.h 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/drivers/crypto/caam/ctrl.h 2015-07-27 23:13:04.209961631 +0200 -@@ -8,6 +8,6 @@ - #define CTRL_H - - /* Prototypes for backend-level services exposed to APIs */ --int caam_get_era(void); -+int caam_get_era(u64 caam_id); - - #endif /* CTRL_H */ -diff -Nur linux-4.1.3/drivers/crypto/caam/desc_constr.h linux-xbian-imx6/drivers/crypto/caam/desc_constr.h ---- linux-4.1.3/drivers/crypto/caam/desc_constr.h 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/drivers/crypto/caam/desc_constr.h 2015-07-27 23:13:04.209961631 +0200 -@@ -10,7 +10,6 @@ - #define CAAM_CMD_SZ sizeof(u32) - #define CAAM_PTR_SZ sizeof(dma_addr_t) - #define CAAM_DESC_BYTES_MAX (CAAM_CMD_SZ * MAX_CAAM_DESCSIZE) --#define DESC_JOB_IO_LEN (CAAM_CMD_SZ * 5 + CAAM_PTR_SZ * 3) - - #ifdef DEBUG - #define PRINT_POS do { printk(KERN_DEBUG "%02d: %s\n", desc_len(desc),\ -@@ -111,26 +110,6 @@ - (*desc)++; - } - --#define append_u32 append_cmd -- --static inline void append_u64(u32 *desc, u64 data) --{ -- u32 *offset = desc_end(desc); -- -- *offset = upper_32_bits(data); -- *(++offset) = lower_32_bits(data); -- -- (*desc) += 2; --} -- --/* Write command without affecting header, and return pointer to next word */ --static inline u32 *write_cmd(u32 *desc, u32 command) --{ -- *desc = command; -- -- return desc + 1; --} -- - static inline void append_cmd_ptr(u32 *desc, dma_addr_t ptr, int len, - u32 command) - { -@@ -143,8 +122,7 @@ - unsigned int len, u32 command) - { - append_cmd(desc, command); -- if (!(command & (SQIN_RTO | SQIN_PRE))) -- append_ptr(desc, ptr); -+ append_ptr(desc, ptr); - append_cmd(desc, len); - } - -@@ -155,29 +133,21 @@ - 
append_data(desc, data, len); - } - --#define APPEND_CMD_RET(cmd, op) \ --static inline u32 *append_##cmd(u32 *desc, u32 options) \ --{ \ -- u32 *cmd = desc_end(desc); \ -- PRINT_POS; \ -- append_cmd(desc, CMD_##op | options); \ -- return cmd; \ -+static inline u32 *append_jump(u32 *desc, u32 options) -+{ -+ u32 *cmd = desc_end(desc); -+ -+ PRINT_POS; -+ append_cmd(desc, CMD_JUMP | options); -+ -+ return cmd; - } --APPEND_CMD_RET(jump, JUMP) --APPEND_CMD_RET(move, MOVE) - - static inline void set_jump_tgt_here(u32 *desc, u32 *jump_cmd) - { - *jump_cmd = *jump_cmd | (desc_len(desc) - (jump_cmd - desc)); - } - --static inline void set_move_tgt_here(u32 *desc, u32 *move_cmd) --{ -- *move_cmd &= ~MOVE_OFFSET_MASK; -- *move_cmd = *move_cmd | ((desc_len(desc) << (MOVE_OFFSET_SHIFT + 2)) & -- MOVE_OFFSET_MASK); --} -- - #define APPEND_CMD(cmd, op) \ - static inline void append_##cmd(u32 *desc, u32 options) \ - { \ -@@ -185,6 +155,7 @@ - append_cmd(desc, CMD_##op | options); \ - } - APPEND_CMD(operation, OPERATION) -+APPEND_CMD(move, MOVE) - - #define APPEND_CMD_LEN(cmd, op) \ - static inline void append_##cmd(u32 *desc, unsigned int len, u32 options) \ -@@ -192,8 +163,6 @@ - PRINT_POS; \ - append_cmd(desc, CMD_##op | len | options); \ - } -- --APPEND_CMD_LEN(seq_load, SEQ_LOAD) - APPEND_CMD_LEN(seq_store, SEQ_STORE) - APPEND_CMD_LEN(seq_fifo_load, SEQ_FIFO_LOAD) - APPEND_CMD_LEN(seq_fifo_store, SEQ_FIFO_STORE) -@@ -207,36 +176,17 @@ - } - APPEND_CMD_PTR(key, KEY) - APPEND_CMD_PTR(load, LOAD) -+APPEND_CMD_PTR(store, STORE) - APPEND_CMD_PTR(fifo_load, FIFO_LOAD) - APPEND_CMD_PTR(fifo_store, FIFO_STORE) - --static inline void append_store(u32 *desc, dma_addr_t ptr, unsigned int len, -- u32 options) --{ -- u32 cmd_src; -- -- cmd_src = options & LDST_SRCDST_MASK; -- -- append_cmd(desc, CMD_STORE | options | len); -- -- /* The following options do not require pointer */ -- if (!(cmd_src == LDST_SRCDST_WORD_DESCBUF_SHARED || -- cmd_src == LDST_SRCDST_WORD_DESCBUF_JOB || -- cmd_src == LDST_SRCDST_WORD_DESCBUF_JOB_WE || -- cmd_src == LDST_SRCDST_WORD_DESCBUF_SHARED_WE)) -- append_ptr(desc, ptr); --} -- - #define APPEND_SEQ_PTR_INTLEN(cmd, op) \ - static inline void append_seq_##cmd##_ptr_intlen(u32 *desc, dma_addr_t ptr, \ - unsigned int len, \ - u32 options) \ - { \ - PRINT_POS; \ -- if (options & (SQIN_RTO | SQIN_PRE)) \ -- append_cmd(desc, CMD_SEQ_##op##_PTR | len | options); \ -- else \ -- append_cmd_ptr(desc, ptr, len, CMD_SEQ_##op##_PTR | options); \ -+ append_cmd_ptr(desc, ptr, len, CMD_SEQ_##op##_PTR | options); \ - } - APPEND_SEQ_PTR_INTLEN(in, IN) - APPEND_SEQ_PTR_INTLEN(out, OUT) -@@ -309,7 +259,7 @@ - */ - #define APPEND_MATH(op, desc, dest, src_0, src_1, len) \ - append_cmd(desc, CMD_MATH | MATH_FUN_##op | MATH_DEST_##dest | \ -- MATH_SRC0_##src_0 | MATH_SRC1_##src_1 | (u32)len); -+ MATH_SRC0_##src_0 | MATH_SRC1_##src_1 | (u32) (len & MATH_LEN_MASK)); - - #define append_math_add(desc, dest, src0, src1, len) \ - APPEND_MATH(ADD, desc, dest, src0, src1, len) -@@ -329,15 +279,13 @@ - APPEND_MATH(LSHIFT, desc, dest, src0, src1, len) - #define append_math_rshift(desc, dest, src0, src1, len) \ - APPEND_MATH(RSHIFT, desc, dest, src0, src1, len) --#define append_math_ldshift(desc, dest, src0, src1, len) \ -- APPEND_MATH(SHLD, desc, dest, src0, src1, len) - - /* Exactly one source is IMM. 
Data is passed in as u32 value */ - #define APPEND_MATH_IMM_u32(op, desc, dest, src_0, src_1, data) \ - do { \ - APPEND_MATH(op, desc, dest, src_0, src_1, CAAM_CMD_SZ); \ - append_cmd(desc, data); \ --} while (0) -+} while (0); - - #define append_math_add_imm_u32(desc, dest, src0, src1, data) \ - APPEND_MATH_IMM_u32(ADD, desc, dest, src0, src1, data) -@@ -357,34 +305,3 @@ - APPEND_MATH_IMM_u32(LSHIFT, desc, dest, src0, src1, data) - #define append_math_rshift_imm_u32(desc, dest, src0, src1, data) \ - APPEND_MATH_IMM_u32(RSHIFT, desc, dest, src0, src1, data) -- --/* Exactly one source is IMM. Data is passed in as u64 value */ --#define APPEND_MATH_IMM_u64(op, desc, dest, src_0, src_1, data) \ --do { \ -- u32 upper = (data >> 16) >> 16; \ -- APPEND_MATH(op, desc, dest, src_0, src_1, CAAM_CMD_SZ * 2 | \ -- (upper ? 0 : MATH_IFB)); \ -- if (upper) \ -- append_u64(desc, data); \ -- else \ -- append_u32(desc, data); \ --} while (0) -- --#define append_math_add_imm_u64(desc, dest, src0, src1, data) \ -- APPEND_MATH_IMM_u64(ADD, desc, dest, src0, src1, data) --#define append_math_sub_imm_u64(desc, dest, src0, src1, data) \ -- APPEND_MATH_IMM_u64(SUB, desc, dest, src0, src1, data) --#define append_math_add_c_imm_u64(desc, dest, src0, src1, data) \ -- APPEND_MATH_IMM_u64(ADDC, desc, dest, src0, src1, data) --#define append_math_sub_b_imm_u64(desc, dest, src0, src1, data) \ -- APPEND_MATH_IMM_u64(SUBB, desc, dest, src0, src1, data) --#define append_math_and_imm_u64(desc, dest, src0, src1, data) \ -- APPEND_MATH_IMM_u64(AND, desc, dest, src0, src1, data) --#define append_math_or_imm_u64(desc, dest, src0, src1, data) \ -- APPEND_MATH_IMM_u64(OR, desc, dest, src0, src1, data) --#define append_math_xor_imm_u64(desc, dest, src0, src1, data) \ -- APPEND_MATH_IMM_u64(XOR, desc, dest, src0, src1, data) --#define append_math_lshift_imm_u64(desc, dest, src0, src1, data) \ -- APPEND_MATH_IMM_u64(LSHIFT, desc, dest, src0, src1, data) --#define append_math_rshift_imm_u64(desc, dest, src0, src1, data) \ -- APPEND_MATH_IMM_u64(RSHIFT, desc, dest, src0, src1, data) -diff -Nur linux-4.1.3/drivers/crypto/caam/desc.h linux-xbian-imx6/drivers/crypto/caam/desc.h ---- linux-4.1.3/drivers/crypto/caam/desc.h 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/drivers/crypto/caam/desc.h 2015-07-27 23:13:04.209961631 +0200 -@@ -2,19 +2,35 @@ - * CAAM descriptor composition header - * Definitions to support CAAM descriptor instruction generation - * -- * Copyright 2008-2011 Freescale Semiconductor, Inc. -+ * Copyright (C) 2008-2013 Freescale Semiconductor, Inc. - */ - - #ifndef DESC_H - #define DESC_H - -+/* -+ * 16-byte hardware scatter/gather table -+ * An 8-byte table exists in the hardware spec, but has never been -+ * implemented to date. The 8/16 option is selected at RTL-compile-time. 
-+ * and this selection is visible in the Compile Time Parameters Register -+ */ -+ -+#define SEC4_SG_LEN_EXT 0x80000000 /* Entry points to table */ -+#define SEC4_SG_LEN_FIN 0x40000000 /* Last ent in table */ -+#define SEC4_SG_BPID_MASK 0x000000ff -+#define SEC4_SG_BPID_SHIFT 16 -+#define SEC4_SG_LEN_MASK 0x3fffffff /* Excludes EXT and FINAL */ -+#define SEC4_SG_OFFS_MASK 0x00001fff -+ - struct sec4_sg_entry { -+#ifdef CONFIG_64BIT - u64 ptr; --#define SEC4_SG_LEN_FIN 0x40000000 --#define SEC4_SG_LEN_EXT 0x80000000 -+#else -+ u32 reserved; -+ u32 ptr; -+#endif - u32 len; -- u8 reserved; -- u8 buf_pool_id; -+ u16 buf_pool_id; - u16 offset; - }; - -@@ -231,12 +247,7 @@ - #define LDST_SRCDST_WORD_PKHA_B_SZ (0x11 << LDST_SRCDST_SHIFT) - #define LDST_SRCDST_WORD_PKHA_N_SZ (0x12 << LDST_SRCDST_SHIFT) - #define LDST_SRCDST_WORD_PKHA_E_SZ (0x13 << LDST_SRCDST_SHIFT) --#define LDST_SRCDST_WORD_CLASS_CTX (0x20 << LDST_SRCDST_SHIFT) - #define LDST_SRCDST_WORD_DESCBUF (0x40 << LDST_SRCDST_SHIFT) --#define LDST_SRCDST_WORD_DESCBUF_JOB (0x41 << LDST_SRCDST_SHIFT) --#define LDST_SRCDST_WORD_DESCBUF_SHARED (0x42 << LDST_SRCDST_SHIFT) --#define LDST_SRCDST_WORD_DESCBUF_JOB_WE (0x45 << LDST_SRCDST_SHIFT) --#define LDST_SRCDST_WORD_DESCBUF_SHARED_WE (0x46 << LDST_SRCDST_SHIFT) - #define LDST_SRCDST_WORD_INFO_FIFO (0x7a << LDST_SRCDST_SHIFT) - - /* Offset in source/destination */ -@@ -321,6 +332,7 @@ - /* Continue - Not the last FIFO store to come */ - #define FIFOST_CONT_SHIFT 23 - #define FIFOST_CONT_MASK (1 << FIFOST_CONT_SHIFT) -+#define FIFOST_CONT_MASK (1 << FIFOST_CONT_SHIFT) - - /* - * Extended Length - use 32-bit extended length that -@@ -370,7 +382,6 @@ - #define FIFOLD_TYPE_LAST2FLUSH1 (0x05 << FIFOLD_TYPE_SHIFT) - #define FIFOLD_TYPE_LASTBOTH (0x06 << FIFOLD_TYPE_SHIFT) - #define FIFOLD_TYPE_LASTBOTHFL (0x07 << FIFOLD_TYPE_SHIFT) --#define FIFOLD_TYPE_NOINFOFIFO (0x0F << FIFOLD_TYPE_SHIFT) - - #define FIFOLDST_LEN_MASK 0xffff - #define FIFOLDST_EXT_LEN_MASK 0xffffffff -@@ -1092,6 +1103,23 @@ - #define OP_PCL_PKPROT_ECC 0x0002 - #define OP_PCL_PKPROT_F2M 0x0001 - -+/* Blob protocol protinfo bits */ -+#define OP_PCL_BLOB_TK 0x0200 -+#define OP_PCL_BLOB_EKT 0x0100 -+ -+#define OP_PCL_BLOB_K2KR_MEM 0x0000 -+#define OP_PCL_BLOB_K2KR_C1KR 0x0010 -+#define OP_PCL_BLOB_K2KR_C2KR 0x0030 -+#define OP_PCL_BLOB_K2KR_AFHAS 0x0050 -+#define OP_PCL_BLOB_K2KR_C2KR_SPLIT 0x0070 -+ -+#define OP_PCL_BLOB_PTXT_SECMEM 0x0008 -+#define OP_PCL_BLOB_BLACK 0x0004 -+ -+#define OP_PCL_BLOB_FMT_NORMAL 0x0000 -+#define OP_PCL_BLOB_FMT_MSTR 0x0002 -+#define OP_PCL_BLOB_FMT_TEST 0x0003 -+ - /* For non-protocol/alg-only op commands */ - #define OP_ALG_TYPE_SHIFT 24 - #define OP_ALG_TYPE_MASK (0x7 << OP_ALG_TYPE_SHIFT) -@@ -1154,15 +1182,8 @@ - - /* randomizer AAI set */ - #define OP_ALG_AAI_RNG (0x00 << OP_ALG_AAI_SHIFT) --#define OP_ALG_AAI_RNG_NZB (0x10 << OP_ALG_AAI_SHIFT) --#define OP_ALG_AAI_RNG_OBP (0x20 << OP_ALG_AAI_SHIFT) -- --/* RNG4 AAI set */ --#define OP_ALG_AAI_RNG4_SH_0 (0x00 << OP_ALG_AAI_SHIFT) --#define OP_ALG_AAI_RNG4_SH_1 (0x01 << OP_ALG_AAI_SHIFT) --#define OP_ALG_AAI_RNG4_PS (0x40 << OP_ALG_AAI_SHIFT) --#define OP_ALG_AAI_RNG4_AI (0x80 << OP_ALG_AAI_SHIFT) --#define OP_ALG_AAI_RNG4_SK (0x100 << OP_ALG_AAI_SHIFT) -+#define OP_ALG_AAI_RNG_NOZERO (0x10 << OP_ALG_AAI_SHIFT) -+#define OP_ALG_AAI_RNG_ODD (0x20 << OP_ALG_AAI_SHIFT) - - /* hmac/smac AAI set */ - #define OP_ALG_AAI_HASH (0x00 << OP_ALG_AAI_SHIFT) -@@ -1184,6 +1205,12 @@ - #define OP_ALG_AAI_GSM (0x10 << OP_ALG_AAI_SHIFT) - #define OP_ALG_AAI_EDGE 
(0x20 << OP_ALG_AAI_SHIFT) - -+/* RNG4 set */ -+#define OP_ALG_RNG4_SHIFT 4 -+#define OP_ALG_RNG4_MASK (0x1f3 << OP_ALG_RNG4_SHIFT) -+ -+#define OP_ALG_RNG4_SK (0x100 << OP_ALG_RNG4_SHIFT) -+ - #define OP_ALG_AS_SHIFT 2 - #define OP_ALG_AS_MASK (0x3 << OP_ALG_AS_SHIFT) - #define OP_ALG_AS_UPDATE (0 << OP_ALG_AS_SHIFT) -@@ -1300,10 +1327,10 @@ - #define SQOUT_SGF 0x01000000 - - /* Appends to a previous pointer */ --#define SQOUT_PRE SQIN_PRE -+#define SQOUT_PRE 0x00800000 - - /* Restore sequence with pointer/length */ --#define SQOUT_RTO SQIN_RTO -+#define SQOUT_RTO 0x00200000 - - /* Use extended length following pointer */ - #define SQOUT_EXT 0x00400000 -@@ -1365,7 +1392,6 @@ - #define MOVE_DEST_MATH3 (0x07 << MOVE_DEST_SHIFT) - #define MOVE_DEST_CLASS1INFIFO (0x08 << MOVE_DEST_SHIFT) - #define MOVE_DEST_CLASS2INFIFO (0x09 << MOVE_DEST_SHIFT) --#define MOVE_DEST_INFIFO_NOINFO (0x0a << MOVE_DEST_SHIFT) - #define MOVE_DEST_PK_A (0x0c << MOVE_DEST_SHIFT) - #define MOVE_DEST_CLASS1KEY (0x0d << MOVE_DEST_SHIFT) - #define MOVE_DEST_CLASS2KEY (0x0e << MOVE_DEST_SHIFT) -@@ -1418,7 +1444,6 @@ - #define MATH_SRC0_REG2 (0x02 << MATH_SRC0_SHIFT) - #define MATH_SRC0_REG3 (0x03 << MATH_SRC0_SHIFT) - #define MATH_SRC0_IMM (0x04 << MATH_SRC0_SHIFT) --#define MATH_SRC0_DPOVRD (0x07 << MATH_SRC0_SHIFT) - #define MATH_SRC0_SEQINLEN (0x08 << MATH_SRC0_SHIFT) - #define MATH_SRC0_SEQOUTLEN (0x09 << MATH_SRC0_SHIFT) - #define MATH_SRC0_VARSEQINLEN (0x0a << MATH_SRC0_SHIFT) -@@ -1433,7 +1458,6 @@ - #define MATH_SRC1_REG2 (0x02 << MATH_SRC1_SHIFT) - #define MATH_SRC1_REG3 (0x03 << MATH_SRC1_SHIFT) - #define MATH_SRC1_IMM (0x04 << MATH_SRC1_SHIFT) --#define MATH_SRC1_DPOVRD (0x07 << MATH_SRC0_SHIFT) - #define MATH_SRC1_INFIFO (0x0a << MATH_SRC1_SHIFT) - #define MATH_SRC1_OUTFIFO (0x0b << MATH_SRC1_SHIFT) - #define MATH_SRC1_ONE (0x0c << MATH_SRC1_SHIFT) -@@ -1609,13 +1633,28 @@ - #define NFIFOENTRY_PLEN_SHIFT 0 - #define NFIFOENTRY_PLEN_MASK (0xFF << NFIFOENTRY_PLEN_SHIFT) - --/* Append Load Immediate Command */ --#define FD_CMD_APPEND_LOAD_IMMEDIATE 0x80000000 -+/* -+ * PDB internal definitions -+ */ -+ -+/* IPSec ESP CBC Encap/Decap Options */ -+#define PDBOPTS_ESPCBC_ARSNONE 0x00 /* no antireplay window */ -+#define PDBOPTS_ESPCBC_ARS32 0x40 /* 32-entry antireplay window */ -+#define PDBOPTS_ESPCBC_ARS64 0xc0 /* 64-entry antireplay window */ -+#define PDBOPTS_ESPCBC_IVSRC 0x20 /* IV comes from internal random gen */ -+#define PDBOPTS_ESPCBC_ESN 0x10 /* extended sequence included */ -+#define PDBOPTS_ESPCBC_OUTFMT 0x08 /* output only decapsulation (decap) */ -+#define PDBOPTS_ESPCBC_IPHDRSRC 0x08 /* IP header comes from PDB (encap) */ -+#define PDBOPTS_ESPCBC_INCIPHDR 0x04 /* Prepend IP header to output frame */ -+#define PDBOPTS_ESPCBC_IPVSN 0x02 /* process IPv6 header */ -+#define PDBOPTS_ESPCBC_TUNNEL 0x01 /* tunnel mode next-header byte */ -+ -+#define ARC4_BLOCK_SIZE 1 -+#define ARC4_MAX_KEY_SIZE 256 -+#define ARC4_MIN_KEY_SIZE 1 - --/* Set SEQ LIODN equal to the Non-SEQ LIODN for the job */ --#define FD_CMD_SET_SEQ_LIODN_EQUAL_NONSEQ_LIODN 0x40000000 -+#define XCBC_MAC_DIGEST_SIZE 16 -+#define XCBC_MAC_BLOCK_WORDS 16 - --/* Frame Descriptor Command for Replacement Job Descriptor */ --#define FD_CMD_REPLACE_JOB_DESC 0x20000000 - - #endif /* DESC_H */ -diff -Nur linux-4.1.3/drivers/crypto/caam/error.c linux-xbian-imx6/drivers/crypto/caam/error.c ---- linux-4.1.3/drivers/crypto/caam/error.c 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/drivers/crypto/caam/error.c 2015-07-27 23:13:04.213947410 +0200 
-@@ -11,243 +11,264 @@ - #include "jr.h" - #include "error.h" - --static const struct { -- u8 value; -- const char *error_text; --} desc_error_list[] = { -- { 0x00, "No error." }, -- { 0x01, "SGT Length Error. The descriptor is trying to read more data than is contained in the SGT table." }, -- { 0x02, "SGT Null Entry Error." }, -- { 0x03, "Job Ring Control Error. There is a bad value in the Job Ring Control register." }, -- { 0x04, "Invalid Descriptor Command. The Descriptor Command field is invalid." }, -- { 0x05, "Reserved." }, -- { 0x06, "Invalid KEY Command" }, -- { 0x07, "Invalid LOAD Command" }, -- { 0x08, "Invalid STORE Command" }, -- { 0x09, "Invalid OPERATION Command" }, -- { 0x0A, "Invalid FIFO LOAD Command" }, -- { 0x0B, "Invalid FIFO STORE Command" }, -- { 0x0C, "Invalid MOVE/MOVE_LEN Command" }, -- { 0x0D, "Invalid JUMP Command. A nonlocal JUMP Command is invalid because the target is not a Job Header Command, or the jump is from a Trusted Descriptor to a Job Descriptor, or because the target Descriptor contains a Shared Descriptor." }, -- { 0x0E, "Invalid MATH Command" }, -- { 0x0F, "Invalid SIGNATURE Command" }, -- { 0x10, "Invalid Sequence Command. A SEQ IN PTR OR SEQ OUT PTR Command is invalid or a SEQ KEY, SEQ LOAD, SEQ FIFO LOAD, or SEQ FIFO STORE decremented the input or output sequence length below 0. This error may result if a built-in PROTOCOL Command has encountered a malformed PDU." }, -- { 0x11, "Skip data type invalid. The type must be 0xE or 0xF."}, -- { 0x12, "Shared Descriptor Header Error" }, -- { 0x13, "Header Error. Invalid length or parity, or certain other problems." }, -- { 0x14, "Burster Error. Burster has gotten to an illegal state" }, -- { 0x15, "Context Register Length Error. The descriptor is trying to read or write past the end of the Context Register. A SEQ LOAD or SEQ STORE with the VLF bit set was executed with too large a length in the variable length register (VSOL for SEQ STORE or VSIL for SEQ LOAD)." }, -- { 0x16, "DMA Error" }, -- { 0x17, "Reserved." }, -- { 0x1A, "Job failed due to JR reset" }, -- { 0x1B, "Job failed due to Fail Mode" }, -- { 0x1C, "DECO Watchdog timer timeout error" }, -- { 0x1D, "DECO tried to copy a key from another DECO but the other DECO's Key Registers were locked" }, -- { 0x1E, "DECO attempted to copy data from a DECO that had an unmasked Descriptor error" }, -- { 0x1F, "LIODN error. DECO was trying to share from itself or from another DECO but the two Non-SEQ LIODN values didn't match or the 'shared from' DECO's Descriptor required that the SEQ LIODNs be the same and they aren't." }, -- { 0x20, "DECO has completed a reset initiated via the DRR register" }, -- { 0x21, "Nonce error. When using EKT (CCM) key encryption option in the FIFO STORE Command, the Nonce counter reached its maximum value and this encryption mode can no longer be used." }, -- { 0x22, "Meta data is too large (> 511 bytes) for TLS decap (input frame; block ciphers) and IPsec decap (output frame, when doing the next header byte update) and DCRC (output frame)." 
}, -- { 0x23, "Read Input Frame error" }, -- { 0x24, "JDKEK, TDKEK or TDSK not loaded error" }, -- { 0x80, "DNR (do not run) error" }, -- { 0x81, "undefined protocol command" }, -- { 0x82, "invalid setting in PDB" }, -- { 0x83, "Anti-replay LATE error" }, -- { 0x84, "Anti-replay REPLAY error" }, -- { 0x85, "Sequence number overflow" }, -- { 0x86, "Sigver invalid signature" }, -- { 0x87, "DSA Sign Illegal test descriptor" }, -- { 0x88, "Protocol Format Error - A protocol has seen an error in the format of data received. When running RSA, this means that formatting with random padding was used, and did not follow the form: 0x00, 0x02, 8-to-N bytes of non-zero pad, 0x00, F data." }, -- { 0x89, "Protocol Size Error - A protocol has seen an error in size. When running RSA, pdb size N < (size of F) when no formatting is used; or pdb size N < (F + 11) when formatting is used." }, -- { 0xC1, "Blob Command error: Undefined mode" }, -- { 0xC2, "Blob Command error: Secure Memory Blob mode error" }, -- { 0xC4, "Blob Command error: Black Blob key or input size error" }, -- { 0xC5, "Blob Command error: Invalid key destination" }, -- { 0xC8, "Blob Command error: Trusted/Secure mode error" }, -- { 0xF0, "IPsec TTL or hop limit field either came in as 0, or was decremented to 0" }, -- { 0xF1, "3GPP HFN matches or exceeds the Threshold" }, --}; -- --static const char * const cha_id_list[] = { -- "", -- "AES", -- "DES", -- "ARC4", -- "MDHA", -- "RNG", -- "SNOW f8", -- "Kasumi f8/9", -- "PKHA", -- "CRCA", -- "SNOW f9", -- "ZUCE", -- "ZUCA", --}; -- --static const char * const err_id_list[] = { -- "No error.", -- "Mode error.", -- "Data size error.", -- "Key size error.", -- "PKHA A memory size error.", -- "PKHA B memory size error.", -- "Data arrived out of sequence error.", -- "PKHA divide-by-zero error.", -- "PKHA modulus even error.", -- "DES key parity error.", -- "ICV check failed.", -- "Hardware error.", -- "Unsupported CCM AAD size.", -- "Class 1 CHA is not reset", -- "Invalid CHA combination was selected", -- "Invalid CHA selected.", --}; -- --static const char * const rng_err_id_list[] = { -- "", -- "", -- "", -- "Instantiate", -- "Not instantiated", -- "Test instantiate", -- "Prediction resistance", -- "Prediction resistance and test request", -- "Uninstantiate", -- "Secure key generation", --}; -+#define SPRINTFCAT(str, format, param, max_alloc) \ -+{ \ -+ char *tmp; \ -+ \ -+ tmp = kmalloc(sizeof(format) + max_alloc, GFP_ATOMIC); \ -+ if (likely(tmp)) { \ -+ sprintf(tmp, format, param); \ -+ strcat(str, tmp); \ -+ kfree(tmp); \ -+ } else { \ -+ strcat(str, "kmalloc failure in SPRINTFCAT"); \ -+ } \ -+} - --static void report_ccb_status(struct device *jrdev, const u32 status, -- const char *error) -+static void report_jump_idx(u32 status, char *outstr) - { -- u8 cha_id = (status & JRSTA_CCBERR_CHAID_MASK) >> -- JRSTA_CCBERR_CHAID_SHIFT; -- u8 err_id = status & JRSTA_CCBERR_ERRID_MASK; - u8 idx = (status & JRSTA_DECOERR_INDEX_MASK) >> - JRSTA_DECOERR_INDEX_SHIFT; -- char *idx_str; -- const char *cha_str = "unidentified cha_id value 0x"; -- char cha_err_code[3] = { 0 }; -- const char *err_str = "unidentified err_id value 0x"; -- char err_err_code[3] = { 0 }; - - if (status & JRSTA_DECOERR_JUMP) -- idx_str = "jump tgt desc idx"; -+ strcat(outstr, "jump tgt desc idx "); - else -- idx_str = "desc idx"; -+ strcat(outstr, "desc idx "); - -- if (cha_id < ARRAY_SIZE(cha_id_list)) -- cha_str = cha_id_list[cha_id]; -- else -- snprintf(cha_err_code, sizeof(cha_err_code), "%02x", cha_id); -+ SPRINTFCAT(outstr, 
"%d: ", idx, sizeof("255")); -+} -+ -+static void report_ccb_status(u32 status, char *outstr) -+{ -+ static const char * const cha_id_list[] = { -+ "", -+ "AES", -+ "DES", -+ "ARC4", -+ "MDHA", -+ "RNG", -+ "SNOW f8", -+ "Kasumi f8/9", -+ "PKHA", -+ "CRCA", -+ "SNOW f9", -+ "ZUCE", -+ "ZUCA", -+ }; -+ static const char * const err_id_list[] = { -+ "No error.", -+ "Mode error.", -+ "Data size error.", -+ "Key size error.", -+ "PKHA A memory size error.", -+ "PKHA B memory size error.", -+ "Data arrived out of sequence error.", -+ "PKHA divide-by-zero error.", -+ "PKHA modulus even error.", -+ "DES key parity error.", -+ "ICV check failed.", -+ "Hardware error.", -+ "Unsupported CCM AAD size.", -+ "Class 1 CHA is not reset", -+ "Invalid CHA combination was selected", -+ "Invalid CHA selected.", -+ }; -+ static const char * const rng_err_id_list[] = { -+ "", -+ "", -+ "", -+ "Instantiate", -+ "Not instantiated", -+ "Test instantiate", -+ "Prediction resistance", -+ "Prediction resistance and test request", -+ "Uninstantiate", -+ "Secure key generation", -+ }; -+ u8 cha_id = (status & JRSTA_CCBERR_CHAID_MASK) >> -+ JRSTA_CCBERR_CHAID_SHIFT; -+ u8 err_id = status & JRSTA_CCBERR_ERRID_MASK; -+ -+ report_jump_idx(status, outstr); -+ -+ if (cha_id < ARRAY_SIZE(cha_id_list)) { -+ SPRINTFCAT(outstr, "%s: ", cha_id_list[cha_id], -+ strlen(cha_id_list[cha_id])); -+ } else { -+ SPRINTFCAT(outstr, "unidentified cha_id value 0x%02x: ", -+ cha_id, sizeof("ff")); -+ } - - if ((cha_id << JRSTA_CCBERR_CHAID_SHIFT) == JRSTA_CCBERR_CHAID_RNG && - err_id < ARRAY_SIZE(rng_err_id_list) && - strlen(rng_err_id_list[err_id])) { - /* RNG-only error */ -- err_str = rng_err_id_list[err_id]; -- } else if (err_id < ARRAY_SIZE(err_id_list)) -- err_str = err_id_list[err_id]; -- else -- snprintf(err_err_code, sizeof(err_err_code), "%02x", err_id); -- -- /* -- * CCB ICV check failures are part of normal operation life; -- * we leave the upper layers to do what they want with them. -- */ -- if (err_id != JRSTA_CCBERR_ERRID_ICVCHK) -- dev_err(jrdev, "%08x: %s: %s %d: %s%s: %s%s\n", -- status, error, idx_str, idx, -- cha_str, cha_err_code, -- err_str, err_err_code); -+ SPRINTFCAT(outstr, "%s", rng_err_id_list[err_id], -+ strlen(rng_err_id_list[err_id])); -+ } else if (err_id < ARRAY_SIZE(err_id_list)) { -+ SPRINTFCAT(outstr, "%s", err_id_list[err_id], -+ strlen(err_id_list[err_id])); -+ } else { -+ SPRINTFCAT(outstr, "unidentified err_id value 0x%02x", -+ err_id, sizeof("ff")); -+ } - } - --static void report_jump_status(struct device *jrdev, const u32 status, -- const char *error) -+static void report_jump_status(u32 status, char *outstr) - { -- dev_err(jrdev, "%08x: %s: %s() not implemented\n", -- status, error, __func__); -+ SPRINTFCAT(outstr, "%s() not implemented", __func__, sizeof(__func__)); - } - --static void report_deco_status(struct device *jrdev, const u32 status, -- const char *error) -+static void report_deco_status(u32 status, char *outstr) - { -- u8 err_id = status & JRSTA_DECOERR_ERROR_MASK; -- u8 idx = (status & JRSTA_DECOERR_INDEX_MASK) >> -- JRSTA_DECOERR_INDEX_SHIFT; -- char *idx_str; -- const char *err_str = "unidentified error value 0x"; -- char err_err_code[3] = { 0 }; -+ static const struct { -+ u8 value; -+ char *error_text; -+ } desc_error_list[] = { -+ { 0x00, "No error." }, -+ { 0x01, "SGT Length Error. The descriptor is trying to read " -+ "more data than is contained in the SGT table." }, -+ { 0x02, "SGT Null Entry Error." }, -+ { 0x03, "Job Ring Control Error. 
There is a bad value in the " -+ "Job Ring Control register." }, -+ { 0x04, "Invalid Descriptor Command. The Descriptor Command " -+ "field is invalid." }, -+ { 0x05, "Reserved." }, -+ { 0x06, "Invalid KEY Command" }, -+ { 0x07, "Invalid LOAD Command" }, -+ { 0x08, "Invalid STORE Command" }, -+ { 0x09, "Invalid OPERATION Command" }, -+ { 0x0A, "Invalid FIFO LOAD Command" }, -+ { 0x0B, "Invalid FIFO STORE Command" }, -+ { 0x0C, "Invalid MOVE/MOVE_LEN Command" }, -+ { 0x0D, "Invalid JUMP Command. A nonlocal JUMP Command is " -+ "invalid because the target is not a Job Header " -+ "Command, or the jump is from a Trusted Descriptor to " -+ "a Job Descriptor, or because the target Descriptor " -+ "contains a Shared Descriptor." }, -+ { 0x0E, "Invalid MATH Command" }, -+ { 0x0F, "Invalid SIGNATURE Command" }, -+ { 0x10, "Invalid Sequence Command. A SEQ IN PTR OR SEQ OUT PTR " -+ "Command is invalid or a SEQ KEY, SEQ LOAD, SEQ FIFO " -+ "LOAD, or SEQ FIFO STORE decremented the input or " -+ "output sequence length below 0. This error may result " -+ "if a built-in PROTOCOL Command has encountered a " -+ "malformed PDU." }, -+ { 0x11, "Skip data type invalid. The type must be 0xE or 0xF."}, -+ { 0x12, "Shared Descriptor Header Error" }, -+ { 0x13, "Header Error. Invalid length or parity, or certain " -+ "other problems." }, -+ { 0x14, "Burster Error. Burster has gotten to an illegal " -+ "state" }, -+ { 0x15, "Context Register Length Error. The descriptor is " -+ "trying to read or write past the end of the Context " -+ "Register. A SEQ LOAD or SEQ STORE with the VLF bit " -+ "set was executed with too large a length in the " -+ "variable length register (VSOL for SEQ STORE or VSIL " -+ "for SEQ LOAD)." }, -+ { 0x16, "DMA Error" }, -+ { 0x17, "Reserved." }, -+ { 0x1A, "Job failed due to JR reset" }, -+ { 0x1B, "Job failed due to Fail Mode" }, -+ { 0x1C, "DECO Watchdog timer timeout error" }, -+ { 0x1D, "DECO tried to copy a key from another DECO but the " -+ "other DECO's Key Registers were locked" }, -+ { 0x1E, "DECO attempted to copy data from a DECO that had an " -+ "unmasked Descriptor error" }, -+ { 0x1F, "LIODN error. DECO was trying to share from itself or " -+ "from another DECO but the two Non-SEQ LIODN values " -+ "didn't match or the 'shared from' DECO's Descriptor " -+ "required that the SEQ LIODNs be the same and they " -+ "aren't." }, -+ { 0x20, "DECO has completed a reset initiated via the DRR " -+ "register" }, -+ { 0x21, "Nonce error. When using EKT (CCM) key encryption " -+ "option in the FIFO STORE Command, the Nonce counter " -+ "reached its maximum value and this encryption mode " -+ "can no longer be used." }, -+ { 0x22, "Meta data is too large (> 511 bytes) for TLS decap " -+ "(input frame; block ciphers) and IPsec decap (output " -+ "frame, when doing the next header byte update) and " -+ "DCRC (output frame)." }, -+ { 0x23, "Read Input Frame error" }, -+ { 0x24, "JDKEK, TDKEK or TDSK not loaded error" }, -+ { 0x80, "DNR (do not run) error" }, -+ { 0x81, "undefined protocol command" }, -+ { 0x82, "invalid setting in PDB" }, -+ { 0x83, "Anti-replay LATE error" }, -+ { 0x84, "Anti-replay REPLAY error" }, -+ { 0x85, "Sequence number overflow" }, -+ { 0x86, "Sigver invalid signature" }, -+ { 0x87, "DSA Sign Illegal test descriptor" }, -+ { 0x88, "Protocol Format Error - A protocol has seen an error " -+ "in the format of data received. 
When running RSA, " -+ "this means that formatting with random padding was " -+ "used, and did not follow the form: 0x00, 0x02, 8-to-N " -+ "bytes of non-zero pad, 0x00, F data." }, -+ { 0x89, "Protocol Size Error - A protocol has seen an error in " -+ "size. When running RSA, pdb size N < (size of F) when " -+ "no formatting is used; or pdb size N < (F + 11) when " -+ "formatting is used." }, -+ { 0xC1, "Blob Command error: Undefined mode" }, -+ { 0xC2, "Blob Command error: Secure Memory Blob mode error" }, -+ { 0xC4, "Blob Command error: Black Blob key or input size " -+ "error" }, -+ { 0xC5, "Blob Command error: Invalid key destination" }, -+ { 0xC8, "Blob Command error: Trusted/Secure mode error" }, -+ { 0xF0, "IPsec TTL or hop limit field either came in as 0, " -+ "or was decremented to 0" }, -+ { 0xF1, "3GPP HFN matches or exceeds the Threshold" }, -+ }; -+ u8 desc_error = status & JRSTA_DECOERR_ERROR_MASK; - int i; - -- if (status & JRSTA_DECOERR_JUMP) -- idx_str = "jump tgt desc idx"; -- else -- idx_str = "desc idx"; -+ report_jump_idx(status, outstr); - - for (i = 0; i < ARRAY_SIZE(desc_error_list); i++) -- if (desc_error_list[i].value == err_id) -+ if (desc_error_list[i].value == desc_error) - break; - -- if (i != ARRAY_SIZE(desc_error_list) && desc_error_list[i].error_text) -- err_str = desc_error_list[i].error_text; -- else -- snprintf(err_err_code, sizeof(err_err_code), "%02x", err_id); -- -- dev_err(jrdev, "%08x: %s: %s %d: %s%s\n", -- status, error, idx_str, idx, err_str, err_err_code); -+ if (i != ARRAY_SIZE(desc_error_list) && desc_error_list[i].error_text) { -+ SPRINTFCAT(outstr, "%s", desc_error_list[i].error_text, -+ strlen(desc_error_list[i].error_text)); -+ } else { -+ SPRINTFCAT(outstr, "unidentified error value 0x%02x", -+ desc_error, sizeof("ff")); -+ } - } - --static void report_jr_status(struct device *jrdev, const u32 status, -- const char *error) -+static void report_jr_status(u32 status, char *outstr) - { -- dev_err(jrdev, "%08x: %s: %s() not implemented\n", -- status, error, __func__); -+ SPRINTFCAT(outstr, "%s() not implemented", __func__, sizeof(__func__)); - } - --static void report_cond_code_status(struct device *jrdev, const u32 status, -- const char *error) -+static void report_cond_code_status(u32 status, char *outstr) - { -- dev_err(jrdev, "%08x: %s: %s() not implemented\n", -- status, error, __func__); -+ SPRINTFCAT(outstr, "%s() not implemented", __func__, sizeof(__func__)); - } - --void caam_jr_strstatus(struct device *jrdev, u32 status) -+char *caam_jr_strstatus(char *outstr, u32 status) - { - static const struct stat_src { -- void (*report_ssed)(struct device *jrdev, const u32 status, -- const char *error); -- const char *error; -- } status_src[16] = { -+ void (*report_ssed)(u32 status, char *outstr); -+ char *error; -+ } status_src[] = { - { NULL, "No error" }, - { NULL, NULL }, - { report_ccb_status, "CCB" }, - { report_jump_status, "Jump" }, - { report_deco_status, "DECO" }, -- { NULL, "Queue Manager Interface" }, -+ { NULL, NULL }, - { report_jr_status, "Job Ring" }, - { report_cond_code_status, "Condition Code" }, -- { NULL, NULL }, -- { NULL, NULL }, -- { NULL, NULL }, -- { NULL, NULL }, -- { NULL, NULL }, -- { NULL, NULL }, -- { NULL, NULL }, -- { NULL, NULL }, - }; - u32 ssrc = status >> JRSTA_SSRC_SHIFT; -- const char *error = status_src[ssrc].error; - -- /* -- * If there is an error handling function, call it to report the error. -- * Otherwise print the error source name. 
-- */ -+ sprintf(outstr, "%s: ", status_src[ssrc].error); -+ - if (status_src[ssrc].report_ssed) -- status_src[ssrc].report_ssed(jrdev, status, error); -- else if (error) -- dev_err(jrdev, "%d: %s\n", ssrc, error); -- else -- dev_err(jrdev, "%d: unknown error source\n", ssrc); -+ status_src[ssrc].report_ssed(status, outstr); -+ -+ return outstr; - } - EXPORT_SYMBOL(caam_jr_strstatus); -diff -Nur linux-4.1.3/drivers/crypto/caam/error.h linux-xbian-imx6/drivers/crypto/caam/error.h ---- linux-4.1.3/drivers/crypto/caam/error.h 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/drivers/crypto/caam/error.h 2015-07-27 23:13:04.213947410 +0200 -@@ -7,5 +7,5 @@ - #ifndef CAAM_ERROR_H - #define CAAM_ERROR_H - #define CAAM_ERROR_STR_MAX 302 --void caam_jr_strstatus(struct device *jrdev, u32 status); -+extern char *caam_jr_strstatus(char *outstr, u32 status); - #endif /* CAAM_ERROR_H */ -diff -Nur linux-4.1.3/drivers/crypto/caam/intern.h linux-xbian-imx6/drivers/crypto/caam/intern.h ---- linux-4.1.3/drivers/crypto/caam/intern.h 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/drivers/crypto/caam/intern.h 2015-07-27 23:13:04.213947410 +0200 -@@ -2,13 +2,19 @@ - * CAAM/SEC 4.x driver backend - * Private/internal definitions between modules - * -- * Copyright 2008-2011 Freescale Semiconductor, Inc. -+ * Copyright (C) 2008-2013 Freescale Semiconductor, Inc. - * - */ - - #ifndef INTERN_H - #define INTERN_H - -+#define JOBR_UNASSIGNED 0 -+#define JOBR_ASSIGNED 1 -+ -+/* Default clock/sample settings for an RNG4 entropy source */ -+#define RNG4_ENT_CLOCKS_SAMPLE 1600 -+ - /* Currently comes from Kconfig param as a ^2 (driver-required) */ - #define JOBR_DEPTH (1 << CONFIG_CRYPTO_DEV_FSL_CAAM_RINGSIZE) - -@@ -37,15 +43,13 @@ - - /* Private sub-storage for a single JobR */ - struct caam_drv_private_jr { -- struct list_head list_node; /* Job Ring device list */ -- struct device *dev; -+ struct device *parentdev; /* points back to controller dev */ -+ struct platform_device *jr_pdev;/* points to platform device for JR */ - int ridx; - struct caam_job_ring __iomem *rregs; /* JobR's register space */ - struct tasklet_struct irqtask; - int irq; /* One per queue */ -- -- /* Number of scatterlist crypt transforms active on the JobR */ -- atomic_t tfm_count ____cacheline_aligned; -+ int assign; /* busy/free */ - - /* Job ring info */ - int ringsize; /* Size of rings (assume input = output) */ -@@ -66,15 +70,20 @@ - struct caam_drv_private { - - struct device *dev; -- struct platform_device **jrpdev; /* Alloc'ed array per sub-device */ -+ struct device *smdev; -+ struct device *secviodev; -+ struct device **jrdev; /* Alloc'ed array per sub-device */ -+ spinlock_t jr_alloc_lock; - struct platform_device *pdev; - - /* Physical-presence section */ -- struct caam_ctrl __iomem *ctrl; /* controller region */ -- struct caam_deco __iomem *deco; /* DECO/CCB views */ -- struct caam_assurance __iomem *assure; -- struct caam_queue_if __iomem *qi; /* QI control region */ -- struct caam_job_ring __iomem *jr[4]; /* JobR's register space */ -+ struct caam_ctrl *ctrl; /* controller region */ -+ struct caam_deco **deco; /* DECO/CCB views */ -+ struct caam_assurance *ac; -+ struct caam_queue_if *qi; /* QI control region */ -+ struct snvs_full __iomem *snvs; /* SNVS HP+LP register space */ -+ dma_addr_t __iomem *sm_base; /* Secure memory storage base */ -+ u32 sm_size; - - /* - * Detected geometry block. 
Filled in from device tree if powerpc, -@@ -83,14 +92,22 @@ - u8 total_jobrs; /* Total Job Rings in device */ - u8 qi_present; /* Nonzero if QI present in device */ - int secvio_irq; /* Security violation interrupt number */ -- int virt_en; /* Virtualization enabled in CAAM */ -- --#define RNG4_MAX_HANDLES 2 -- /* RNG4 block */ -- u32 rng4_sh_init; /* This bitmap shows which of the State -- Handles of the RNG4 block are initialized -- by this driver */ -+ int rng_inst; /* Total instantiated RNGs */ - -+ /* which jr allocated to scatterlist crypto */ -+ atomic_t tfm_count ____cacheline_aligned; -+ int num_jrs_for_algapi; -+ struct device **algapi_jr; -+ /* list of registered crypto algorithms (mk generic context handle?) */ -+ struct list_head alg_list; -+ /* list of registered hash algorithms (mk generic context handle?) */ -+ struct list_head hash_list; -+ -+#ifdef CONFIG_ARM -+ struct clk *caam_ipg; -+ struct clk *caam_mem; -+ struct clk *caam_aclk; -+#endif - /* - * debugfs entries for developer view into driver/device - * variables at runtime. -diff -Nur linux-4.1.3/drivers/crypto/caam/jr.c linux-xbian-imx6/drivers/crypto/caam/jr.c ---- linux-4.1.3/drivers/crypto/caam/jr.c 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/drivers/crypto/caam/jr.c 2015-07-27 23:13:04.213947410 +0200 -@@ -2,125 +2,15 @@ - * CAAM/SEC 4.x transport/backend driver - * JobR backend functionality - * -- * Copyright 2008-2012 Freescale Semiconductor, Inc. -+ * Copyright (C) 2008-2013 Freescale Semiconductor, Inc. - */ - --#include --#include -- - #include "compat.h" - #include "regs.h" - #include "jr.h" - #include "desc.h" - #include "intern.h" - --struct jr_driver_data { -- /* List of Physical JobR's with the Driver */ -- struct list_head jr_list; -- spinlock_t jr_alloc_lock; /* jr_list lock */ --} ____cacheline_aligned; -- --static struct jr_driver_data driver_data; -- --static int caam_reset_hw_jr(struct device *dev) --{ -- struct caam_drv_private_jr *jrp = dev_get_drvdata(dev); -- unsigned int timeout = 100000; -- -- /* -- * mask interrupts since we are going to poll -- * for reset completion status -- */ -- setbits32(&jrp->rregs->rconfig_lo, JRCFG_IMSK); -- -- /* initiate flush (required prior to reset) */ -- wr_reg32(&jrp->rregs->jrcommand, JRCR_RESET); -- while (((rd_reg32(&jrp->rregs->jrintstatus) & JRINT_ERR_HALT_MASK) == -- JRINT_ERR_HALT_INPROGRESS) && --timeout) -- cpu_relax(); -- -- if ((rd_reg32(&jrp->rregs->jrintstatus) & JRINT_ERR_HALT_MASK) != -- JRINT_ERR_HALT_COMPLETE || timeout == 0) { -- dev_err(dev, "failed to flush job ring %d\n", jrp->ridx); -- return -EIO; -- } -- -- /* initiate reset */ -- timeout = 100000; -- wr_reg32(&jrp->rregs->jrcommand, JRCR_RESET); -- while ((rd_reg32(&jrp->rregs->jrcommand) & JRCR_RESET) && --timeout) -- cpu_relax(); -- -- if (timeout == 0) { -- dev_err(dev, "failed to reset job ring %d\n", jrp->ridx); -- return -EIO; -- } -- -- /* unmask interrupts */ -- clrbits32(&jrp->rregs->rconfig_lo, JRCFG_IMSK); -- -- return 0; --} -- --/* -- * Shutdown JobR independent of platform property code -- */ --int caam_jr_shutdown(struct device *dev) --{ -- struct caam_drv_private_jr *jrp = dev_get_drvdata(dev); -- dma_addr_t inpbusaddr, outbusaddr; -- int ret; -- -- ret = caam_reset_hw_jr(dev); -- -- tasklet_kill(&jrp->irqtask); -- -- /* Release interrupt */ -- free_irq(jrp->irq, dev); -- -- /* Free rings */ -- inpbusaddr = rd_reg64(&jrp->rregs->inpring_base); -- outbusaddr = rd_reg64(&jrp->rregs->outring_base); -- dma_free_coherent(dev, sizeof(dma_addr_t) * 
JOBR_DEPTH, -- jrp->inpring, inpbusaddr); -- dma_free_coherent(dev, sizeof(struct jr_outentry) * JOBR_DEPTH, -- jrp->outring, outbusaddr); -- kfree(jrp->entinfo); -- -- return ret; --} -- --static int caam_jr_remove(struct platform_device *pdev) --{ -- int ret; -- struct device *jrdev; -- struct caam_drv_private_jr *jrpriv; -- -- jrdev = &pdev->dev; -- jrpriv = dev_get_drvdata(jrdev); -- -- /* -- * Return EBUSY if job ring already allocated. -- */ -- if (atomic_read(&jrpriv->tfm_count)) { -- dev_err(jrdev, "Device is busy\n"); -- return -EBUSY; -- } -- -- /* Remove the node from Physical JobR list maintained by driver */ -- spin_lock(&driver_data.jr_alloc_lock); -- list_del(&jrpriv->list_node); -- spin_unlock(&driver_data.jr_alloc_lock); -- -- /* Release ring */ -- ret = caam_jr_shutdown(jrdev); -- if (ret) -- dev_err(jrdev, "Failed to shut down job ring\n"); -- irq_dispose_mapping(jrpriv->irq); -- -- return ret; --} -- - /* Main per-ring interrupt handler */ - static irqreturn_t caam_jr_interrupt(int irq, void *st_dev) - { -@@ -168,6 +58,9 @@ - void (*usercall)(struct device *dev, u32 *desc, u32 status, void *arg); - u32 *userdesc, userstatus; - void *userarg; -+ dma_addr_t outbusaddr; -+ -+ outbusaddr = rd_reg64(&jrp->rregs->outring_base); - - while (rd_reg32(&jrp->rregs->outring_used)) { - -@@ -177,10 +70,15 @@ - - sw_idx = tail = jrp->tail; - hw_idx = jrp->out_ring_read_index; -+ dma_sync_single_for_cpu(dev, outbusaddr, -+ sizeof(struct jr_outentry) * JOBR_DEPTH, -+ DMA_FROM_DEVICE); - - for (i = 0; CIRC_CNT(head, tail + i, JOBR_DEPTH) >= 1; i++) { - sw_idx = (tail + i) & (JOBR_DEPTH - 1); - -+ smp_read_barrier_depends(); -+ - if (jrp->outring[hw_idx].desc == - jrp->entinfo[sw_idx].desc_addr_dma) - break; /* found */ -@@ -202,6 +100,8 @@ - userdesc = jrp->entinfo[sw_idx].desc_addr_virt; - userstatus = jrp->outring[hw_idx].jrstatus; - -+ smp_mb(); -+ - /* set done */ - wr_reg32(&jrp->rregs->outring_rmvd, 1); - -@@ -216,6 +116,7 @@ - if (sw_idx == tail) { - do { - tail = (tail + 1) & (JOBR_DEPTH - 1); -+ smp_read_barrier_depends(); - } while (CIRC_CNT(head, tail, JOBR_DEPTH) >= 1 && - jrp->entinfo[tail].desc_addr_dma == 0); - -@@ -233,57 +134,70 @@ - } - - /** -- * caam_jr_alloc() - Alloc a job ring for someone to use as needed. -- * -- * returns : pointer to the newly allocated physical -- * JobR dev can be written to if successful. -+ * caam_jr_register() - Alloc a ring for someone to use as needed. Returns -+ * an ordinal of the rings allocated, else returns -ENODEV if no rings -+ * are available. -+ * @ctrldev: points to the controller level dev (parent) that -+ * owns rings available for use. -+ * @dev: points to where a pointer to the newly allocated queue's -+ * dev can be written to if successful. 
- **/ --struct device *caam_jr_alloc(void) -+int caam_jr_register(struct device *ctrldev, struct device **rdev) - { -- struct caam_drv_private_jr *jrpriv, *min_jrpriv = NULL; -- struct device *dev = NULL; -- int min_tfm_cnt = INT_MAX; -- int tfm_cnt; -- -- spin_lock(&driver_data.jr_alloc_lock); -- -- if (list_empty(&driver_data.jr_list)) { -- spin_unlock(&driver_data.jr_alloc_lock); -- return ERR_PTR(-ENODEV); -- } -- -- list_for_each_entry(jrpriv, &driver_data.jr_list, list_node) { -- tfm_cnt = atomic_read(&jrpriv->tfm_count); -- if (tfm_cnt < min_tfm_cnt) { -- min_tfm_cnt = tfm_cnt; -- min_jrpriv = jrpriv; -+ struct caam_drv_private *ctrlpriv = dev_get_drvdata(ctrldev); -+ struct caam_drv_private_jr *jrpriv = NULL; -+ int ring; -+ -+ /* Lock, if free ring - assign, unlock */ -+ spin_lock(&ctrlpriv->jr_alloc_lock); -+ for (ring = 0; ring < ctrlpriv->total_jobrs; ring++) { -+ jrpriv = dev_get_drvdata(ctrlpriv->jrdev[ring]); -+ if (jrpriv->assign == JOBR_UNASSIGNED) { -+ jrpriv->assign = JOBR_ASSIGNED; -+ *rdev = ctrlpriv->jrdev[ring]; -+ spin_unlock(&ctrlpriv->jr_alloc_lock); -+ return ring; - } -- if (!min_tfm_cnt) -- break; - } - -- if (min_jrpriv) { -- atomic_inc(&min_jrpriv->tfm_count); -- dev = min_jrpriv->dev; -- } -- spin_unlock(&driver_data.jr_alloc_lock); -+ /* If assigned, write dev where caller needs it */ -+ spin_unlock(&ctrlpriv->jr_alloc_lock); -+ *rdev = NULL; - -- return dev; -+ return -ENODEV; - } --EXPORT_SYMBOL(caam_jr_alloc); -+EXPORT_SYMBOL(caam_jr_register); - - /** -- * caam_jr_free() - Free the Job Ring -- * @rdev - points to the dev that identifies the Job ring to -- * be released. -+ * caam_jr_deregister() - Deregister an API and release the queue. -+ * Returns 0 if OK, -EBUSY if queue still contains pending entries -+ * or unprocessed results at the time of the call -+ * @dev - points to the dev that identifies the queue to -+ * be released. - **/ --void caam_jr_free(struct device *rdev) -+int caam_jr_deregister(struct device *rdev) - { - struct caam_drv_private_jr *jrpriv = dev_get_drvdata(rdev); -+ struct caam_drv_private *ctrlpriv; -+ -+ /* Get the owning controller's private space */ -+ ctrlpriv = dev_get_drvdata(jrpriv->parentdev); -+ -+ /* -+ * Make sure ring empty before release -+ */ -+ if (rd_reg32(&jrpriv->rregs->outring_used) || -+ (rd_reg32(&jrpriv->rregs->inpring_avail) != JOBR_DEPTH)) -+ return -EBUSY; - -- atomic_dec(&jrpriv->tfm_count); -+ /* Release ring */ -+ spin_lock(&ctrlpriv->jr_alloc_lock); -+ jrpriv->assign = JOBR_UNASSIGNED; -+ spin_unlock(&ctrlpriv->jr_alloc_lock); -+ -+ return 0; - } --EXPORT_SYMBOL(caam_jr_free); -+EXPORT_SYMBOL(caam_jr_deregister); - - /** - * caam_jr_enqueue() - Enqueue a job descriptor head. 
Returns 0 if OK, -@@ -321,7 +235,7 @@ - struct caam_drv_private_jr *jrp = dev_get_drvdata(dev); - struct caam_jrentry_info *head_entry; - int head, tail, desc_size; -- dma_addr_t desc_dma; -+ dma_addr_t desc_dma, inpbusaddr; - - desc_size = (*desc & HDR_JD_LENGTH_MASK) * sizeof(u32); - desc_dma = dma_map_single(dev, desc, desc_size, DMA_TO_DEVICE); -@@ -330,6 +244,13 @@ - return -EIO; - } - -+ dma_sync_single_for_device(dev, desc_dma, desc_size, DMA_TO_DEVICE); -+ -+ inpbusaddr = rd_reg64(&jrp->rregs->inpring_base); -+ dma_sync_single_for_device(dev, inpbusaddr, -+ sizeof(dma_addr_t) * JOBR_DEPTH, -+ DMA_TO_DEVICE); -+ - spin_lock_bh(&jrp->inplock); - - head = jrp->head; -@@ -351,12 +272,18 @@ - - jrp->inpring[jrp->inp_ring_write_index] = desc_dma; - -+ dma_sync_single_for_device(dev, inpbusaddr, -+ sizeof(dma_addr_t) * JOBR_DEPTH, -+ DMA_TO_DEVICE); -+ - smp_wmb(); - - jrp->inp_ring_write_index = (jrp->inp_ring_write_index + 1) & - (JOBR_DEPTH - 1); - jrp->head = (head + 1) & (JOBR_DEPTH - 1); - -+ wmb(); -+ - wr_reg32(&jrp->rregs->inpring_jobadd, 1); - - spin_unlock_bh(&jrp->inplock); -@@ -365,6 +292,46 @@ - } - EXPORT_SYMBOL(caam_jr_enqueue); - -+static int caam_reset_hw_jr(struct device *dev) -+{ -+ struct caam_drv_private_jr *jrp = dev_get_drvdata(dev); -+ unsigned int timeout = 100000; -+ -+ /* -+ * mask interrupts since we are going to poll -+ * for reset completion status -+ */ -+ setbits32(&jrp->rregs->rconfig_lo, JRCFG_IMSK); -+ -+ /* initiate flush (required prior to reset) */ -+ wr_reg32(&jrp->rregs->jrcommand, JRCR_RESET); -+ while (((rd_reg32(&jrp->rregs->jrintstatus) & JRINT_ERR_HALT_MASK) == -+ JRINT_ERR_HALT_INPROGRESS) && --timeout) -+ cpu_relax(); -+ -+ if ((rd_reg32(&jrp->rregs->jrintstatus) & JRINT_ERR_HALT_MASK) != -+ JRINT_ERR_HALT_COMPLETE || timeout == 0) { -+ dev_err(dev, "failed to flush job ring %d\n", jrp->ridx); -+ return -EIO; -+ } -+ -+ /* initiate reset */ -+ timeout = 100000; -+ wr_reg32(&jrp->rregs->jrcommand, JRCR_RESET); -+ while ((rd_reg32(&jrp->rregs->jrcommand) & JRCR_RESET) && --timeout) -+ cpu_relax(); -+ -+ if (timeout == 0) { -+ dev_err(dev, "failed to reset job ring %d\n", jrp->ridx); -+ return -EIO; -+ } -+ -+ /* unmask interrupts */ -+ clrbits32(&jrp->rregs->rconfig_lo, JRCFG_IMSK); -+ -+ return 0; -+} -+ - /* - * Init JobR independent of platform property detection - */ -@@ -380,32 +347,34 @@ - - /* Connect job ring interrupt handler. 
*/ - error = request_irq(jrp->irq, caam_jr_interrupt, IRQF_SHARED, -- dev_name(dev), dev); -+ "caam-jobr", dev); - if (error) { - dev_err(dev, "can't connect JobR %d interrupt (%d)\n", - jrp->ridx, jrp->irq); -- goto out_kill_deq; -+ irq_dispose_mapping(jrp->irq); -+ jrp->irq = 0; -+ return -EINVAL; - } - - error = caam_reset_hw_jr(dev); - if (error) -- goto out_free_irq; -+ return error; - -- error = -ENOMEM; - jrp->inpring = dma_alloc_coherent(dev, sizeof(dma_addr_t) * JOBR_DEPTH, - &inpbusaddr, GFP_KERNEL); -- if (!jrp->inpring) -- goto out_free_irq; - - jrp->outring = dma_alloc_coherent(dev, sizeof(struct jr_outentry) * - JOBR_DEPTH, &outbusaddr, GFP_KERNEL); -- if (!jrp->outring) -- goto out_free_inpring; - - jrp->entinfo = kzalloc(sizeof(struct caam_jrentry_info) * JOBR_DEPTH, - GFP_KERNEL); -- if (!jrp->entinfo) -- goto out_free_outring; -+ -+ if ((jrp->inpring == NULL) || (jrp->outring == NULL) || -+ (jrp->entinfo == NULL)) { -+ dev_err(dev, "can't allocate job rings for %d\n", -+ jrp->ridx); -+ return -ENOMEM; -+ } - - for (i = 0; i < JOBR_DEPTH; i++) - jrp->entinfo[i].desc_addr_dma = !0; -@@ -431,120 +400,123 @@ - (JOBR_INTC_COUNT_THLD << JRCFG_ICDCT_SHIFT) | - (JOBR_INTC_TIME_THLD << JRCFG_ICTT_SHIFT)); - -+ jrp->assign = JOBR_UNASSIGNED; - return 0; -+} - --out_free_outring: -- dma_free_coherent(dev, sizeof(struct jr_outentry) * JOBR_DEPTH, -- jrp->outring, outbusaddr); --out_free_inpring: -+/* -+ * Shutdown JobR independent of platform property code -+ */ -+int caam_jr_shutdown(struct device *dev) -+{ -+ struct caam_drv_private_jr *jrp = dev_get_drvdata(dev); -+ dma_addr_t inpbusaddr, outbusaddr; -+ int ret; -+ -+ ret = caam_reset_hw_jr(dev); -+ -+ tasklet_kill(&jrp->irqtask); -+ -+ /* Release interrupt */ -+ free_irq(jrp->irq, dev); -+ -+ /* Free rings */ -+ inpbusaddr = rd_reg64(&jrp->rregs->inpring_base); -+ outbusaddr = rd_reg64(&jrp->rregs->outring_base); - dma_free_coherent(dev, sizeof(dma_addr_t) * JOBR_DEPTH, - jrp->inpring, inpbusaddr); -- dev_err(dev, "can't allocate job rings for %d\n", jrp->ridx); --out_free_irq: -- free_irq(jrp->irq, dev); --out_kill_deq: -- tasklet_kill(&jrp->irqtask); -- return error; --} -+ dma_free_coherent(dev, sizeof(struct jr_outentry) * JOBR_DEPTH, -+ jrp->outring, outbusaddr); -+ kfree(jrp->entinfo); -+ of_device_unregister(jrp->jr_pdev); - -+ return ret; -+} - - /* -- * Probe routine for each detected JobR subsystem. -+ * Probe routine for each detected JobR subsystem. It assumes that -+ * property detection was picked up externally. 
- */ --static int caam_jr_probe(struct platform_device *pdev) -+int caam_jr_probe(struct platform_device *pdev, struct device_node *np, -+ int ring) - { -- struct device *jrdev; -- struct device_node *nprop; -- struct caam_job_ring __iomem *ctrl; -+ struct device *ctrldev, *jrdev; -+ struct platform_device *jr_pdev; -+ struct caam_drv_private *ctrlpriv; - struct caam_drv_private_jr *jrpriv; -- static int total_jobrs; -+ const __be32 *jroffset_addr; -+ u32 jroffset; - int error; - -- jrdev = &pdev->dev; -- jrpriv = devm_kmalloc(jrdev, sizeof(struct caam_drv_private_jr), -- GFP_KERNEL); -- if (!jrpriv) -+ ctrldev = &pdev->dev; -+ ctrlpriv = dev_get_drvdata(ctrldev); -+ -+ jrpriv = kmalloc(sizeof(struct caam_drv_private_jr), -+ GFP_KERNEL); -+ if (jrpriv == NULL) { -+ dev_err(ctrldev, "can't alloc private mem for job ring %d\n", -+ ring); - return -ENOMEM; -+ } -+ jrpriv->parentdev = ctrldev; /* point back to parent */ -+ jrpriv->ridx = ring; /* save ring identity relative to detection */ - -- dev_set_drvdata(jrdev, jrpriv); -+ /* -+ * Derive a pointer to the detected JobRs regs -+ * Driver has already iomapped the entire space, we just -+ * need to add in the offset to this JobR. Don't know if I -+ * like this long-term, but it'll run -+ */ -+ jroffset_addr = of_get_property(np, "reg", NULL); - -- /* save ring identity relative to detection */ -- jrpriv->ridx = total_jobrs++; -+ if (jroffset_addr == NULL) { -+ kfree(jrpriv); -+ return -EINVAL; -+ } - -- nprop = pdev->dev.of_node; -- /* Get configuration properties from device tree */ -- /* First, get register page */ -- ctrl = of_iomap(nprop, 0); -- if (!ctrl) { -- dev_err(jrdev, "of_iomap() failed\n"); -- return -ENOMEM; -+ /* -+ * Fix the endianness of this value read from the device -+ * tree if running on ARM. 
-+ */ -+ jroffset = be32_to_cpup(jroffset_addr); -+ -+ jrpriv->rregs = (struct caam_job_ring __iomem *)((void *)ctrlpriv->ctrl -+ + jroffset); -+ -+ /* Build a local dev for each detected queue */ -+ jr_pdev = of_platform_device_create(np, NULL, ctrldev); -+ if (jr_pdev == NULL) { -+ kfree(jrpriv); -+ return -EINVAL; - } - -- jrpriv->rregs = (struct caam_job_ring __force *)ctrl; -+ jrpriv->jr_pdev = jr_pdev; -+ jrdev = &jr_pdev->dev; -+ dev_set_drvdata(jrdev, jrpriv); -+ ctrlpriv->jrdev[ring] = jrdev; - - if (sizeof(dma_addr_t) == sizeof(u64)) -- if (of_device_is_compatible(nprop, "fsl,sec-v5.0-job-ring")) -- dma_set_mask_and_coherent(jrdev, DMA_BIT_MASK(40)); -+ if (of_device_is_compatible(np, "fsl,sec-v4.0-job-ring")) -+ dma_set_mask(jrdev, DMA_BIT_MASK(40)); - else -- dma_set_mask_and_coherent(jrdev, DMA_BIT_MASK(36)); -+ dma_set_mask(jrdev, DMA_BIT_MASK(36)); - else -- dma_set_mask_and_coherent(jrdev, DMA_BIT_MASK(32)); -+ dma_set_mask(jrdev, DMA_BIT_MASK(32)); - - /* Identify the interrupt */ -- jrpriv->irq = irq_of_parse_and_map(nprop, 0); -+ jrpriv->irq = of_irq_to_resource(np, 0, NULL); -+ if (jrpriv->irq <= 0) { -+ kfree(jrpriv); -+ return -EINVAL; -+ } - - /* Now do the platform independent part */ - error = caam_jr_init(jrdev); /* now turn on hardware */ - if (error) { -- irq_dispose_mapping(jrpriv->irq); -+ of_device_unregister(jr_pdev); -+ kfree(jrpriv); - return error; - } - -- jrpriv->dev = jrdev; -- spin_lock(&driver_data.jr_alloc_lock); -- list_add_tail(&jrpriv->list_node, &driver_data.jr_list); -- spin_unlock(&driver_data.jr_alloc_lock); -- -- atomic_set(&jrpriv->tfm_count, 0); -- -- return 0; --} -- --static struct of_device_id caam_jr_match[] = { -- { -- .compatible = "fsl,sec-v4.0-job-ring", -- }, -- { -- .compatible = "fsl,sec4.0-job-ring", -- }, -- {}, --}; --MODULE_DEVICE_TABLE(of, caam_jr_match); -- --static struct platform_driver caam_jr_driver = { -- .driver = { -- .name = "caam_jr", -- .of_match_table = caam_jr_match, -- }, -- .probe = caam_jr_probe, -- .remove = caam_jr_remove, --}; -- --static int __init jr_driver_init(void) --{ -- spin_lock_init(&driver_data.jr_alloc_lock); -- INIT_LIST_HEAD(&driver_data.jr_list); -- return platform_driver_register(&caam_jr_driver); --} -- --static void __exit jr_driver_exit(void) --{ -- platform_driver_unregister(&caam_jr_driver); -+ return error; - } -- --module_init(jr_driver_init); --module_exit(jr_driver_exit); -- --MODULE_LICENSE("GPL"); --MODULE_DESCRIPTION("FSL CAAM JR request backend"); --MODULE_AUTHOR("Freescale Semiconductor - NMG/STC"); -diff -Nur linux-4.1.3/drivers/crypto/caam/jr.h linux-xbian-imx6/drivers/crypto/caam/jr.h ---- linux-4.1.3/drivers/crypto/caam/jr.h 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/drivers/crypto/caam/jr.h 2015-07-27 23:13:04.213947410 +0200 -@@ -1,18 +1,22 @@ - /* - * CAAM public-level include definitions for the JobR backend - * -- * Copyright 2008-2011 Freescale Semiconductor, Inc. -+ * Copyright (C) 2008-2013 Freescale Semiconductor, Inc. 
- */ - - #ifndef JR_H - #define JR_H - - /* Prototypes for backend-level services exposed to APIs */ --struct device *caam_jr_alloc(void); --void caam_jr_free(struct device *rdev); -+int caam_jr_register(struct device *ctrldev, struct device **rdev); -+int caam_jr_deregister(struct device *rdev); - int caam_jr_enqueue(struct device *dev, u32 *desc, - void (*cbk)(struct device *dev, u32 *desc, u32 status, - void *areq), - void *areq); - -+extern int caam_jr_probe(struct platform_device *pdev, struct device_node *np, -+ int ring); -+extern int caam_jr_shutdown(struct device *dev); -+extern struct device *caam_get_jrdev(void); - #endif /* JR_H */ -diff -Nur linux-4.1.3/drivers/crypto/caam/Kconfig linux-xbian-imx6/drivers/crypto/caam/Kconfig ---- linux-4.1.3/drivers/crypto/caam/Kconfig 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/drivers/crypto/caam/Kconfig 2015-07-27 23:13:04.205975852 +0200 -@@ -1,32 +1,19 @@ - config CRYPTO_DEV_FSL_CAAM - tristate "Freescale CAAM-Multicore driver backend" -- depends on FSL_SOC -+ depends on FSL_SOC || ARCH_MXC - help - Enables the driver module for Freescale's Cryptographic Accelerator - and Assurance Module (CAAM), also known as the SEC version 4 (SEC4). -- This module creates job ring devices, and configures h/w -+ This module adds a job ring operation interface, and configures h/w - to operate as a DPAA component automatically, depending - on h/w feature availability. - - To compile this driver as a module, choose M here: the module - will be called caam. - --config CRYPTO_DEV_FSL_CAAM_JR -- tristate "Freescale CAAM Job Ring driver backend" -- depends on CRYPTO_DEV_FSL_CAAM -- default y -- help -- Enables the driver module for Job Rings which are part of -- Freescale's Cryptographic Accelerator -- and Assurance Module (CAAM). This module adds a job ring operation -- interface. -- -- To compile this driver as a module, choose M here: the module -- will be called caam_jr. -- - config CRYPTO_DEV_FSL_CAAM_RINGSIZE - int "Job Ring size" -- depends on CRYPTO_DEV_FSL_CAAM_JR -+ depends on CRYPTO_DEV_FSL_CAAM - range 2 9 - default "9" - help -@@ -44,7 +31,7 @@ - - config CRYPTO_DEV_FSL_CAAM_INTC - bool "Job Ring interrupt coalescing" -- depends on CRYPTO_DEV_FSL_CAAM_JR -+ depends on CRYPTO_DEV_FSL_CAAM - default n - help - Enable the Job Ring's interrupt coalescing feature. -@@ -75,7 +62,7 @@ - - config CRYPTO_DEV_FSL_CAAM_CRYPTO_API - tristate "Register algorithm implementations with the Crypto API" -- depends on CRYPTO_DEV_FSL_CAAM && CRYPTO_DEV_FSL_CAAM_JR -+ depends on CRYPTO_DEV_FSL_CAAM - default y - select CRYPTO_ALGAPI - select CRYPTO_AUTHENC -@@ -89,7 +76,7 @@ - - config CRYPTO_DEV_FSL_CAAM_AHASH_API - tristate "Register hash algorithm implementations with Crypto API" -- depends on CRYPTO_DEV_FSL_CAAM && CRYPTO_DEV_FSL_CAAM_JR -+ depends on CRYPTO_DEV_FSL_CAAM - default y - select CRYPTO_HASH - help -@@ -101,7 +88,7 @@ - - config CRYPTO_DEV_FSL_CAAM_RNG_API - tristate "Register caam device for hwrng API" -- depends on CRYPTO_DEV_FSL_CAAM && CRYPTO_DEV_FSL_CAAM_JR -+ depends on CRYPTO_DEV_FSL_CAAM - default y - select CRYPTO_RNG - select HW_RANDOM -@@ -112,6 +99,54 @@ - To compile this as a module, choose M here: the module - will be called caamrng. - -+config CRYPTO_DEV_FSL_CAAM_RNG_TEST -+ boolean "Test caam rng" -+ depends on CRYPTO_DEV_FSL_CAAM_RNG_API -+ default n -+ help -+ Selecting this will enable self-test for caam rng. 
-+ -+config CRYPTO_DEV_FSL_CAAM_SM -+ tristate "CAAM Secure Memory / Keystore API (EXPERIMENTAL)" -+ default n -+ help -+ Enables use of a prototype kernel-level Keystore API with CAAM -+ Secure Memory for insertion/extraction of bus-protected secrets. -+ -+config CRYPTO_DEV_FSL_CAAM_SM_SLOTSIZE -+ int "Size of each keystore slot in Secure Memory" -+ depends on CRYPTO_DEV_FSL_CAAM_SM -+ range 5 9 -+ default 7 -+ help -+ Select size of allocation units to divide Secure Memory pages into -+ (the size of a "slot" as referenced inside the API code). -+ Established as powers of two. -+ Examples: -+ 5 => 32 bytes -+ 6 => 64 bytes -+ 7 => 128 bytes -+ 8 => 256 bytes -+ 9 => 512 bytes -+ -+config CRYPTO_DEV_FSL_CAAM_SM_TEST -+ tristate "CAAM Secure Memory - Keystore Test/Example (EXPERIMENTAL)" -+ depends on CRYPTO_DEV_FSL_CAAM_SM -+ default n -+ help -+ Example thread to exercise the Keystore API and to verify that -+ stored and recovered secrets can be used for general purpose -+ encryption/decryption. -+ -+config CRYPTO_DEV_FSL_CAAM_SECVIO -+ tristate "CAAM/SNVS Security Violation Handler (EXPERIMENTAL)" -+ depends on CRYPTO_DEV_FSL_CAAM -+ default n -+ help -+ Enables installation of an interrupt handler with registrable -+ handler functions which can be specified to act on the consequences -+ of a security violation. -+ - config CRYPTO_DEV_FSL_CAAM_DEBUG - bool "Enable debug output in CAAM driver" - depends on CRYPTO_DEV_FSL_CAAM -@@ -119,3 +154,19 @@ - help - Selecting this will enable printing of various debug - information in the CAAM driver. -+ -+config CRYPTO_DEV_FSL_CAAM_KEYBLOB -+ tristate "Freescale CAAM memory keyblob driver backend" -+ depends on CRYPTO_DEV_FSL_CAAM -+ depends on CRYPTO_DEV_FSL_CAAM_JR -+ default y -+ help -+ Enables the driver module for Key Blob which are part of -+ Freescale's Cryptographic Accelerator -+ and Assurance Module (CAAM). This module adds a key blob operation -+ interface. -+ -+ To compile this driver as a module, choose M here: the module -+ will be called caam_keyblob. -+ -+ -diff -Nur linux-4.1.3/drivers/crypto/caam/key_gen.c linux-xbian-imx6/drivers/crypto/caam/key_gen.c ---- linux-4.1.3/drivers/crypto/caam/key_gen.c 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/drivers/crypto/caam/key_gen.c 2015-07-27 23:13:04.213947410 +0200 -@@ -1,7 +1,7 @@ - /* - * CAAM/SEC 4.x functions for handling key-generation jobs - * -- * Copyright 2008-2011 Freescale Semiconductor, Inc. -+ * Copyright (C) 2008-2013 Freescale Semiconductor, Inc. 
- * - */ - #include "compat.h" -@@ -19,8 +19,11 @@ - dev_err(dev, "%s %d: err 0x%x\n", __func__, __LINE__, err); - #endif - -- if (err) -- caam_jr_strstatus(dev, err); -+ if (err) { -+ char tmp[CAAM_ERROR_STR_MAX]; -+ -+ dev_err(dev, "%08x: %s\n", err, caam_jr_strstatus(tmp, err)); -+ } - - res->err = err; - -@@ -48,29 +51,24 @@ - u32 *desc; - struct split_key_result result; - dma_addr_t dma_addr_in, dma_addr_out; -- int ret = -ENOMEM; -+ int ret = 0; - - desc = kmalloc(CAAM_CMD_SZ * 6 + CAAM_PTR_SZ * 2, GFP_KERNEL | GFP_DMA); - if (!desc) { - dev_err(jrdev, "unable to allocate key input memory\n"); -- return ret; -+ return -ENOMEM; - } - -+ init_job_desc(desc, 0); -+ - dma_addr_in = dma_map_single(jrdev, (void *)key_in, keylen, - DMA_TO_DEVICE); - if (dma_mapping_error(jrdev, dma_addr_in)) { - dev_err(jrdev, "unable to map key input memory\n"); -- goto out_free; -+ kfree(desc); -+ return -ENOMEM; - } -- -- dma_addr_out = dma_map_single(jrdev, key_out, split_key_pad_len, -- DMA_FROM_DEVICE); -- if (dma_mapping_error(jrdev, dma_addr_out)) { -- dev_err(jrdev, "unable to map key output memory\n"); -- goto out_unmap_in; -- } -- -- init_job_desc(desc, 0); -+ dma_sync_single_for_device(jrdev, dma_addr_in, keylen, DMA_TO_DEVICE); - append_key(desc, dma_addr_in, keylen, CLASS_2 | KEY_DEST_CLASS_REG); - - /* Sets MDHA up into an HMAC-INIT */ -@@ -91,9 +89,9 @@ - LDST_CLASS_2_CCB | FIFOST_TYPE_SPLIT_KEK); - - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "ctx.key@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "ctx.key@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, key_in, keylen, 1); -- print_hex_dump(KERN_ERR, "jobdesc@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "jobdesc@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, desc, desc_bytes(desc), 1); - #endif - -@@ -106,12 +104,13 @@ - wait_for_completion_interruptible(&result.completion); - ret = result.err; - #ifdef DEBUG -- print_hex_dump(KERN_ERR, "ctx.key@"__stringify(__LINE__)": ", -+ print_hex_dump(KERN_ERR, "ctx.key@"xstr(__LINE__)": ", - DUMP_PREFIX_ADDRESS, 16, 4, key_out, - split_key_pad_len, 1); - #endif - } -- -+ dma_sync_single_for_cpu(jrdev, dma_addr_out, split_key_pad_len, -+ DMA_FROM_DEVICE); - dma_unmap_single(jrdev, dma_addr_out, split_key_pad_len, - DMA_FROM_DEVICE); - out_unmap_in: -diff -Nur linux-4.1.3/drivers/crypto/caam/Makefile linux-xbian-imx6/drivers/crypto/caam/Makefile ---- linux-4.1.3/drivers/crypto/caam/Makefile 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/drivers/crypto/caam/Makefile 2015-07-27 23:13:04.205975852 +0200 -@@ -1,15 +1,14 @@ - # - # Makefile for the CAAM backend and dependent components - # --ifeq ($(CONFIG_CRYPTO_DEV_FSL_CAAM_DEBUG), y) -- EXTRA_CFLAGS := -DDEBUG --endif - - obj-$(CONFIG_CRYPTO_DEV_FSL_CAAM) += caam.o --obj-$(CONFIG_CRYPTO_DEV_FSL_CAAM_JR) += caam_jr.o - obj-$(CONFIG_CRYPTO_DEV_FSL_CAAM_CRYPTO_API) += caamalg.o - obj-$(CONFIG_CRYPTO_DEV_FSL_CAAM_AHASH_API) += caamhash.o - obj-$(CONFIG_CRYPTO_DEV_FSL_CAAM_RNG_API) += caamrng.o -+obj-$(CONFIG_CRYPTO_DEV_FSL_CAAM_SM) += sm_store.o -+obj-$(CONFIG_CRYPTO_DEV_FSL_CAAM_SM_TEST) += sm_test.o -+obj-$(CONFIG_CRYPTO_DEV_FSL_CAAM_SECVIO) += secvio.o -+obj-$(CONFIG_CRYPTO_DEV_FSL_CAAM_KEYBLOB) += caam_keyblob.o - --caam-objs := ctrl.o --caam_jr-objs := jr.o key_gen.o error.o -+caam-objs := ctrl.o jr.o error.o key_gen.o -diff -Nur linux-4.1.3/drivers/crypto/caam/pdb.h linux-xbian-imx6/drivers/crypto/caam/pdb.h ---- linux-4.1.3/drivers/crypto/caam/pdb.h 2015-07-21 19:10:33.000000000 +0200 -+++ 
linux-xbian-imx6/drivers/crypto/caam/pdb.h 2015-07-27 23:13:04.213947410 +0200 -@@ -44,7 +44,6 @@ - #define PDBOPTS_ESP_IPHDRSRC 0x08 /* IP header comes from PDB (encap) */ - #define PDBOPTS_ESP_INCIPHDR 0x04 /* Prepend IP header to output frame */ - #define PDBOPTS_ESP_IPVSN 0x02 /* process IPv6 header */ --#define PDBOPTS_ESP_AOFL 0x04 /* adjust out frame len (decap, SEC>=5.3)*/ - #define PDBOPTS_ESP_TUNNEL 0x01 /* tunnel mode next-header byte */ - #define PDBOPTS_ESP_IPV6 0x02 /* ip header version is V6 */ - #define PDBOPTS_ESP_DIFFSERV 0x40 /* copy TOS/TC from inner iphdr */ -diff -Nur linux-4.1.3/drivers/crypto/caam/regs.h linux-xbian-imx6/drivers/crypto/caam/regs.h ---- linux-4.1.3/drivers/crypto/caam/regs.h 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/drivers/crypto/caam/regs.h 2015-07-27 23:13:04.213947410 +0200 -@@ -1,7 +1,7 @@ - /* - * CAAM hardware register-level view - * -- * Copyright 2008-2011 Freescale Semiconductor, Inc. -+ * Copyright (C) 2008-2013 Freescale Semiconductor, Inc. - */ - - #ifndef REGS_H -@@ -74,17 +74,22 @@ - #endif - #else - #ifdef __LITTLE_ENDIAN --#define wr_reg32(reg, data) __raw_writel(data, reg) --#define rd_reg32(reg) __raw_readl(reg) -+#define wr_reg32(reg, data) writel(data, reg) -+#define rd_reg32(reg) readl(reg) - #ifdef CONFIG_64BIT --#define wr_reg64(reg, data) __raw_writeq(data, reg) --#define rd_reg64(reg) __raw_readq(reg) -+#define wr_reg64(reg, data) writeq(data, reg) -+#define rd_reg64(reg) readq(reg) - #endif - #endif - #endif - -+#ifdef CONFIG_ARM -+/* These are common macros for Power, put here for ARMs */ -+#define setbits32(_addr, _v) writel((readl(_addr) | (_v)), (_addr)) -+#define clrbits32(_addr, _v) writel((readl(_addr) & ~(_v)), (_addr)) -+#endif -+ - #ifndef CONFIG_64BIT --#ifdef __BIG_ENDIAN - static inline void wr_reg64(u64 __iomem *reg, u64 data) - { - wr_reg32((u32 __iomem *)reg, (data & 0xffffffff00000000ull) >> 32); -@@ -96,21 +101,6 @@ - return (((u64)rd_reg32((u32 __iomem *)reg)) << 32) | - ((u64)rd_reg32((u32 __iomem *)reg + 1)); - } --#else --#ifdef __LITTLE_ENDIAN --static inline void wr_reg64(u64 __iomem *reg, u64 data) --{ -- wr_reg32((u32 __iomem *)reg + 1, (data & 0xffffffff00000000ull) >> 32); -- wr_reg32((u32 __iomem *)reg, data & 0x00000000ffffffffull); --} -- --static inline u64 rd_reg64(u64 __iomem *reg) --{ -- return (((u64)rd_reg32((u32 __iomem *)reg + 1)) << 32) | -- ((u64)rd_reg32((u32 __iomem *)reg)); --} --#endif --#endif - #endif - - /* -@@ -123,6 +113,98 @@ - } __packed; - - /* -+ * CHA version ID / instantiation bitfields -+ * Defined for use within cha_id in perfmon -+ * Note that the same shift/mask selectors can be used to pull out number -+ * of instantiated blocks within cha_num in perfmon, the locations are -+ * the same. 
-+ */ -+ -+/* Job Ring */ -+#define CHA_ID_JR_SHIFT 60 -+#define CHA_ID_JR_MASK (0xfull << CHA_ID_JR_SHIFT) -+ -+/* DEscriptor COntroller */ -+#define CHA_ID_DECO_SHIFT 56 -+#define CHA_ID_DECO_MASK (0xfull << CHA_ID_DECO_SHIFT) -+#define CHA_NUM_DECONUM_SHIFT 56 /* legacy definition */ -+#define CHA_NUM_DECONUM_MASK (0xfull << CHA_NUM_DECONUM_SHIFT) -+ -+/* ZUC-Authentication */ -+#define CHA_ID_ZA_SHIFT 44 -+#define CHA_ID_ZA_MASK (0xfull << CHA_ID_ZA_SHIFT) -+ -+/* ZUC-Encryption */ -+#define CHA_ID_ZE_SHIFT 40 -+#define CHA_ID_ZE_MASK (0xfull << CHA_ID_ZE_SHIFT) -+ -+/* SNOW f9 */ -+#define CHA_ID_SNW9_SHIFT 36 -+#define CHA_ID_SNW9_MASK (0xfull << CHA_ID_SNW9_SHIFT) -+ -+/* CRC */ -+#define CHA_ID_CRC_SHIFT 32 -+#define CHA_ID_CRC_MASK (0xfull << CHA_ID_CRC_SHIFT) -+ -+/* Public Key */ -+#define CHA_ID_PK_SHIFT 28 -+#define CHA_ID_PK_MASK (0xfull << CHA_ID_PK_SHIFT) -+ -+/* Kasumi */ -+#define CHA_ID_KAS_SHIFT 24 -+#define CHA_ID_KAS_MASK (0xfull << CHA_ID_KAS_SHIFT) -+ -+/* SNOW f8 */ -+#define CHA_ID_SNW8_SHIFT 20 -+#define CHA_ID_SNW8_MASK (0xfull << CHA_ID_SNW8_SHIFT) -+ -+/* -+ * Random Generator -+ * RNG4 = FIPS-verification-compliant, requires init kickstart for use -+ */ -+#define CHA_ID_RNG_SHIFT 16 -+#define CHA_ID_RNG_MASK (0xfull << CHA_ID_RNG_SHIFT) -+#define CHA_ID_RNG_A (0x1ull << CHA_ID_RNG_SHIFT) -+#define CHA_ID_RNG_B (0x2ull << CHA_ID_RNG_SHIFT) -+#define CHA_ID_RNG_C (0x3ull << CHA_ID_RNG_SHIFT) -+#define CHA_ID_RNG_4 (0x4ull << CHA_ID_RNG_SHIFT) -+ -+/* -+ * Message Digest -+ * LP256 = Low Power (MD5/SHA1/SHA224/SHA256 + HMAC) -+ * LP512 = Low Power (LP256 + SHA384/SHA512) -+ * HP = High Power (LP512 + SMAC) -+ */ -+#define CHA_ID_MD_SHIFT 12 -+#define CHA_ID_MD_MASK (0xfull << CHA_ID_MD_SHIFT) -+#define CHA_ID_MD_LP256 (0x0ull << CHA_ID_MD_SHIFT) -+#define CHA_ID_MD_LP512 (0x1ull << CHA_ID_MD_SHIFT) -+#define CHA_ID_MD_HP (0x2ull << CHA_ID_MD_SHIFT) -+ -+/* ARC4 Streamcipher */ -+#define CHA_ID_ARC4_SHIFT 8 -+#define CHA_ID_ARC4_MASK (0xfull << CHA_ID_ARC4_SHIFT) -+#define CHA_ID_ARC4_LP (0x0ull << CHA_ID_ARC4_SHIFT) -+#define CHA_ID_ARC4_HP (0x1ull << CHA_ID_ARC4_SHIFT) -+ -+/* DES Blockcipher Accelerator */ -+#define CHA_ID_DES_SHIFT 4 -+#define CHA_ID_DES_MASK (0xfull << CHA_ID_DES_SHIFT) -+ -+/* -+ * AES Blockcipher + Combo Mode Accelerator -+ * LP = Low Power (includes ECB/CBC/CFB128/OFB/CTR/CCM/CMAC/XCBC-MAC) -+ * HP = High Power (LP + CBCXCBC/CTRXCBC/XTS/GCM) -+ * DIFFPWR = ORed in if differential-power-analysis resistance implemented -+ */ -+#define CHA_ID_AES_SHIFT 0 -+#define CHA_ID_AES_MASK (0xfull << CHA_ID_AES_SHIFT) -+#define CHA_ID_AES_LP (0x3ull << CHA_ID_AES_SHIFT) -+#define CHA_ID_AES_HP (0x4ull << CHA_ID_AES_SHIFT) -+#define CHA_ID_AES_DIFFPWR (0x1ull << CHA_ID_AES_SHIFT) -+ -+ -+/* - * caam_perfmon - Performance Monitor/Secure Memory Status/ - * CAAM Global Status/Component Version IDs - * -@@ -130,45 +212,8 @@ - */ - - /* Number of DECOs */ --#define CHA_NUM_MS_DECONUM_SHIFT 24 --#define CHA_NUM_MS_DECONUM_MASK (0xfull << CHA_NUM_MS_DECONUM_SHIFT) -- --/* CHA Version IDs */ --#define CHA_ID_LS_AES_SHIFT 0 --#define CHA_ID_LS_AES_MASK (0xfull << CHA_ID_LS_AES_SHIFT) -- --#define CHA_ID_LS_DES_SHIFT 4 --#define CHA_ID_LS_DES_MASK (0xfull << CHA_ID_LS_DES_SHIFT) -- --#define CHA_ID_LS_ARC4_SHIFT 8 --#define CHA_ID_LS_ARC4_MASK (0xfull << CHA_ID_LS_ARC4_SHIFT) -- --#define CHA_ID_LS_MD_SHIFT 12 --#define CHA_ID_LS_MD_MASK (0xfull << CHA_ID_LS_MD_SHIFT) -- --#define CHA_ID_LS_RNG_SHIFT 16 --#define CHA_ID_LS_RNG_MASK (0xfull << 
CHA_ID_LS_RNG_SHIFT) -- --#define CHA_ID_LS_SNW8_SHIFT 20 --#define CHA_ID_LS_SNW8_MASK (0xfull << CHA_ID_LS_SNW8_SHIFT) -- --#define CHA_ID_LS_KAS_SHIFT 24 --#define CHA_ID_LS_KAS_MASK (0xfull << CHA_ID_LS_KAS_SHIFT) -- --#define CHA_ID_LS_PK_SHIFT 28 --#define CHA_ID_LS_PK_MASK (0xfull << CHA_ID_LS_PK_SHIFT) -- --#define CHA_ID_MS_CRC_SHIFT 0 --#define CHA_ID_MS_CRC_MASK (0xfull << CHA_ID_MS_CRC_SHIFT) -- --#define CHA_ID_MS_SNW9_SHIFT 4 --#define CHA_ID_MS_SNW9_MASK (0xfull << CHA_ID_MS_SNW9_SHIFT) -- --#define CHA_ID_MS_DECO_SHIFT 24 --#define CHA_ID_MS_DECO_MASK (0xfull << CHA_ID_MS_DECO_SHIFT) -- --#define CHA_ID_MS_JR_SHIFT 28 --#define CHA_ID_MS_JR_MASK (0xfull << CHA_ID_MS_JR_SHIFT) -+#define CHA_NUM_DECONUM_SHIFT 56 -+#define CHA_NUM_DECONUM_MASK (0xfull << CHA_NUM_DECONUM_SHIFT) - - struct sec_vid { - u16 ip_id; -@@ -176,6 +221,10 @@ - u8 min_rev; - }; - -+#define SEC_VID_IPID_SHIFT 16 -+#define SEC_VID_MAJ_SHIFT 8 -+#define SEC_VID_MAJ_MASK 0xFF00 -+ - struct caam_perfmon { - /* Performance Monitor Registers f00-f9f */ - u64 req_dequeued; /* PC_REQ_DEQ - Dequeued Requests */ -@@ -188,36 +237,89 @@ - u64 rsvd[13]; - - /* CAAM Hardware Instantiation Parameters fa0-fbf */ -- u32 cha_rev_ms; /* CRNR - CHA Rev No. Most significant half*/ -- u32 cha_rev_ls; /* CRNR - CHA Rev No. Least significant half*/ --#define CTPR_MS_QI_SHIFT 25 --#define CTPR_MS_QI_MASK (0x1ull << CTPR_MS_QI_SHIFT) --#define CTPR_MS_VIRT_EN_INCL 0x00000001 --#define CTPR_MS_VIRT_EN_POR 0x00000002 --#define CTPR_MS_PG_SZ_MASK 0x10 --#define CTPR_MS_PG_SZ_SHIFT 4 -- u32 comp_parms_ms; /* CTPR - Compile Parameters Register */ -- u32 comp_parms_ls; /* CTPR - Compile Parameters Register */ -- u64 rsvd1[2]; -+ u64 cha_rev; /* CRNR - CHA Revision Number */ -+#define CTPR_QI_SHIFT 57 -+#define CTPR_QI_MASK (0x1ull << CTPR_QI_SHIFT) -+ u64 comp_parms; /* CTPR - Compile Parameters Register */ -+ -+ /* Secure Memory State Visibility */ -+ u32 rsvd1; -+ u32 smstatus; /* Secure memory status */ -+ u32 rsvd2; -+ u32 smpartown; /* Secure memory partition owner */ - - /* CAAM Global Status fc0-fdf */ - u64 faultaddr; /* FAR - Fault Address */ - u32 faultliodn; /* FALR - Fault Address LIODN */ - u32 faultdetail; /* FADR - Fault Addr Detail */ -- u32 rsvd2; -+ u32 rsvd3; - u32 status; /* CSTA - CAAM Status */ -- u64 rsvd3; -+ u32 smpart; /* Secure Memory Partition Parameters */ -+ u32 smvid; /* Secure Memory Version ID */ - - /* Component Instantiation Parameters fe0-fff */ - u32 rtic_id; /* RVID - RTIC Version ID */ - u32 ccb_id; /* CCBVID - CCB Version ID */ -- u32 cha_id_ms; /* CHAVID - CHA Version ID Most Significant*/ -- u32 cha_id_ls; /* CHAVID - CHA Version ID Least Significant*/ -- u32 cha_num_ms; /* CHANUM - CHA Number Most Significant */ -- u32 cha_num_ls; /* CHANUM - CHA Number Least Significant*/ -- u32 caam_id_ms; /* CAAMVID - CAAM Version ID MS */ -- u32 caam_id_ls; /* CAAMVID - CAAM Version ID LS */ --}; -+ u64 cha_id; /* CHAVID - CHA Version ID */ -+ u64 cha_num; /* CHANUM - CHA Number */ -+ u64 caam_id; /* CAAMVID - CAAM Version ID */ -+}; -+ -+#define SMSTATUS_PART_SHIFT 28 -+#define SMSTATUS_PART_MASK (0xf << SMSTATUS_PART_SHIFT) -+#define SMSTATUS_PAGE_SHIFT 16 -+#define SMSTATUS_PAGE_MASK (0x7ff << SMSTATUS_PAGE_SHIFT) -+#define SMSTATUS_MID_SHIFT 8 -+#define SMSTATUS_MID_MASK (0x3f << SMSTATUS_MID_SHIFT) -+#define SMSTATUS_ACCERR_SHIFT 4 -+#define SMSTATUS_ACCERR_MASK (0xf << SMSTATUS_ACCERR_SHIFT) -+#define SMSTATUS_ACCERR_NONE 0 -+#define SMSTATUS_ACCERR_ALLOC 1 /* Page not allocated */ -+#define 
SMSTATUS_ACCESS_ID 2 /* Not granted by ID */ -+#define SMSTATUS_ACCESS_WRITE 3 /* Writes not allowed */ -+#define SMSTATUS_ACCESS_READ 4 /* Reads not allowed */ -+#define SMSTATUS_ACCESS_NONKEY 6 /* Non-key reads not allowed */ -+#define SMSTATUS_ACCESS_BLOB 9 /* Blob access not allowed */ -+#define SMSTATUS_ACCESS_DESCB 10 /* Descriptor Blob access spans pages */ -+#define SMSTATUS_ACCESS_NON_SM 11 /* Outside Secure Memory range */ -+#define SMSTATUS_ACCESS_XPAGE 12 /* Access crosses pages */ -+#define SMSTATUS_ACCESS_INITPG 13 /* Page still initializing */ -+#define SMSTATUS_STATE_SHIFT 0 -+#define SMSTATUS_STATE_MASK (0xf << SMSTATUS_STATE_SHIFT) -+#define SMSTATUS_STATE_RESET 0 -+#define SMSTATUS_STATE_INIT 1 -+#define SMSTATUS_STATE_NORMAL 2 -+#define SMSTATUS_STATE_FAIL 3 -+ -+/* up to 15 rings, 2 bits shifted by ring number */ -+#define SMPARTOWN_RING_SHIFT 2 -+#define SMPARTOWN_RING_MASK 3 -+#define SMPARTOWN_AVAILABLE 0 -+#define SMPARTOWN_NOEXIST 1 -+#define SMPARTOWN_UNAVAILABLE 2 -+#define SMPARTOWN_OURS 3 -+ -+/* Maximum number of pages possible */ -+#define SMPART_MAX_NUMPG_SHIFT 16 -+#define SMPART_MAX_NUMPG_MASK (0x3f << SMPART_MAX_NUMPG_SHIFT) -+ -+/* Maximum partition number */ -+#define SMPART_MAX_PNUM_SHIFT 12 -+#define SMPART_MAX_PNUM_MASK (0xf << SMPART_MAX_PNUM_SHIFT) -+ -+/* Highest possible page number */ -+#define SMPART_MAX_PG_SHIFT 0 -+#define SMPART_MAX_PG_MASK (0x3f << SMPART_MAX_PG_SHIFT) -+ -+/* Max size of a page */ -+#define SMVID_PG_SIZE_SHIFT 16 -+#define SMVID_PG_SIZE_MASK (0x7 << SMVID_PG_SIZE_SHIFT) -+ -+/* Major/Minor Version ID */ -+#define SMVID_MAJ_VERS_SHIFT 8 -+#define SMVID_MAJ_VERS (0xf << SMVID_MAJ_VERS_SHIFT) -+#define SMVID_MIN_VERS_SHIFT 0 -+#define SMVID_MIN_VERS (0xf << SMVID_MIN_VERS_SHIFT) - - /* LIODN programming for DMA configuration */ - #define MSTRID_LOCK_LIODN 0x80000000 -@@ -270,17 +372,7 @@ - - /* RNG4 TRNG test registers */ - struct rng4tst { --#define RTMCTL_PRGM 0x00010000 /* 1 -> program mode, 0 -> run mode */ --#define RTMCTL_SAMP_MODE_VON_NEUMANN_ES_SC 0 /* use von Neumann data in -- both entropy shifter and -- statistical checker */ --#define RTMCTL_SAMP_MODE_RAW_ES_SC 1 /* use raw data in both -- entropy shifter and -- statistical checker */ --#define RTMCTL_SAMP_MODE_VON_NEUMANN_ES_RAW_SC 2 /* use von Neumann data in -- entropy shifter, raw data -- in statistical checker */ --#define RTMCTL_SAMP_MODE_INVALID 3 /* invalid combination */ -+#define RTMCTL_PRGM 0x00010000 /* 1 -> program mode, 0 -> run mode */ - u32 rtmctl; /* misc. control register */ - u32 rtscmisc; /* statistical check misc. register */ - u32 rtpkrrng; /* poker range register */ -@@ -290,26 +382,22 @@ - }; - #define RTSDCTL_ENT_DLY_SHIFT 16 - #define RTSDCTL_ENT_DLY_MASK (0xffff << RTSDCTL_ENT_DLY_SHIFT) --#define RTSDCTL_ENT_DLY_MIN 3200 --#define RTSDCTL_ENT_DLY_MAX 12800 - u32 rtsdctl; /* seed control register */ - union { - u32 rtsblim; /* PRGM=1: sparse bit limit register */ - u32 rttotsam; /* PRGM=0: total samples register */ - }; - u32 rtfrqmin; /* frequency count min. limit register */ --#define RTFRQMAX_DISABLE (1 << 20) - union { - u32 rtfrqmax; /* PRGM=1: freq. count max. limit register */ - u32 rtfrqcnt; /* PRGM=0: freq. 
count register */ - }; - u32 rsvd1[40]; --#define RDSTA_SKVT 0x80000000 --#define RDSTA_SKVN 0x40000000 --#define RDSTA_IF0 0x00000001 --#define RDSTA_IF1 0x00000002 --#define RDSTA_IFMASK (RDSTA_IF1 | RDSTA_IF0) -- u32 rdsta; -+#define RDSTA_IF 0x00000003 /* state handle instantiated flags 0 and 1 */ -+#define RDSTA_SKVN 0x40000000 /* Secure Key Valid Non-Test mode */ -+#define RDSTA_SKVT 0x80000000 /* Secure Key Valid Test. non-test mode */ -+#define RDSTA_TF 0x00000300 /* State handle instantiated Test-mode */ -+ u32 rdsta; /* DRNG status register */ - u32 rsvd2[15]; - }; - -@@ -340,12 +428,9 @@ - /* Bus Access Configuration Section 010-11f */ - /* Read/Writable */ - struct masterid jr_mid[4]; /* JRxLIODNR - JobR LIODN setup */ -- u32 rsvd3[11]; -- u32 jrstart; /* JRSTART - Job Ring Start Register */ -+ u32 rsvd3[12]; - struct masterid rtic_mid[4]; /* RTICxLIODNR - RTIC LIODN setup */ -- u32 rsvd4[5]; -- u32 deco_rsr; /* DECORSR - Deco Request Source */ -- u32 rsvd11; -+ u32 rsvd4[7]; - u32 deco_rq; /* DECORR - DECO Request */ - struct partid deco_mid[5]; /* DECOxLIODNR - 1 per DECO */ - u32 rsvd5[22]; -@@ -386,11 +471,6 @@ - #define MCFGR_DMA_RESET 0x10000000 - #define MCFGR_LONG_PTR 0x00010000 /* Use >32-bit desc addressing */ - #define SCFGR_RDBENABLE 0x00000400 --#define SCFGR_VIRT_EN 0x00008000 --#define DECORR_RQD0ENABLE 0x00000001 /* Enable DECO0 for direct access */ --#define DECORSR_JR0 0x00000001 /* JR to supply TZ, SDID, ICID */ --#define DECORSR_VALID 0x80000000 --#define DECORR_DEN0 0x00010000 /* DECO0 available for access*/ - - /* AXI read cache control */ - #define MCFGR_ARCACHE_SHIFT 12 -@@ -407,12 +487,6 @@ - #define MCFGR_AXIPRI 0x00000008 /* Assert AXI priority sideband */ - #define MCFGR_BURST_64 0x00000001 /* Max burst size */ - --/* JRSTART register offsets */ --#define JRSTART_JR0_START 0x00000001 /* Start Job ring 0 */ --#define JRSTART_JR1_START 0x00000002 /* Start Job ring 1 */ --#define JRSTART_JR2_START 0x00000004 /* Start Job ring 2 */ --#define JRSTART_JR3_START 0x00000008 /* Start Job ring 3 */ -- - /* - * caam_job_ring - direct job ring setup - * 1-4 possible per instantiation, base + 1000/2000/3000/4000 -@@ -455,7 +529,18 @@ - u32 rsvd11; - u32 jrcommand; /* JRCRx - JobR command */ - -- u32 rsvd12[932]; -+ u32 rsvd12[33]; -+ -+ /* Secure Memory Configuration - if you have it */ -+ u32 sm_cmd; /* SMCJRx - Secure memory command */ -+ u32 rsvd13; -+ u32 sm_status; /* SMCSJRx - Secure memory status */ -+ u32 rsvd14; -+ u32 sm_perm; /* SMAPJRx - Secure memory access perms */ -+ u32 sm_group2; /* SMAP2JRx - Secure memory access group 2 */ -+ u32 sm_group1; /* SMAP1JRx - Secure memory access group 1 */ -+ -+ u32 rsvd15[891]; - - /* Performance Monitor f00-fff */ - struct caam_perfmon perfmon; -@@ -578,6 +663,62 @@ - - #define JRCR_RESET 0x01 - -+/* secure memory command */ -+#define SMC_PAGE_SHIFT 16 -+#define SMC_PAGE_MASK (0xffff << SMC_PAGE_SHIFT) -+#define SMC_PART_SHIFT 8 -+#define SMC_PART_MASK (0x0f << SMC_PART_SHIFT) -+#define SMC_CMD_SHIFT 0 -+#define SMC_CMD_MASK (0x0f << SMC_CMD_SHIFT) -+ -+#define SMC_CMD_ALLOC_PAGE 0x01 /* allocate page to this partition */ -+#define SMC_CMD_DEALLOC_PAGE 0x02 /* deallocate page from partition */ -+#define SMC_CMD_DEALLOC_PART 0x03 /* deallocate partition */ -+#define SMC_CMD_PAGE_INQUIRY 0x05 /* find partition associate with page */ -+ -+/* secure memory (command) status */ -+#define SMCS_PAGE_SHIFT 16 -+#define SMCS_PAGE_MASK (0x0fff << SMCS_PAGE_SHIFT) -+#define SMCS_CMDERR_SHIFT 14 -+#define SMCS_CMDERR_MASK (3 
<< SMCS_CMDERR_SHIFT) -+#define SMCS_ALCERR_SHIFT 12 -+#define SMCS_ALCERR_MASK (3 << SMCS_ALCERR_SHIFT) -+#define SMCS_PGOWN_SHIFT 6 -+#define SMCS_PGWON_MASK (3 << SMCS_PGOWN_SHIFT) -+#define SMCS_PART_SHIFT 0 -+#define SMCS_PART_MASK (0xf << SMCS_PART_SHIFT) -+ -+#define SMCS_CMDERR_NONE 0 -+#define SMCS_CMDERR_INCOMP 1 /* Command not yet complete */ -+#define SMCS_CMDERR_SECFAIL 2 /* Security failure occurred */ -+#define SMCS_CMDERR_OVERFLOW 3 /* Command overflow */ -+ -+#define SMCS_ALCERR_NONE 0 -+#define SMCS_ALCERR_PSPERR 1 /* Partion marked PSP (dealloc only) */ -+#define SMCS_ALCERR_PAGEAVAIL 2 /* Page not available */ -+#define SMCS_ALCERR_PARTOWN 3 /* Partition ownership error */ -+ -+#define SMCS_PGOWN_AVAIL 0 /* Page is available */ -+#define SMCS_PGOWN_NOEXIST 1 /* Page initializing or nonexistent */ -+#define SMCS_PGOWN_NOOWN 2 /* Page owned by another processor */ -+#define SMCS_PGOWN_OWNED 3 /* Page belongs to this processor */ -+ -+/* secure memory access permissions */ -+#define SMCS_PERM_KEYMOD_SHIFT 16 -+#define SMCA_PERM_KEYMOD_MASK (0xff << SMCS_PERM_KEYMOD_SHIFT) -+#define SMCA_PERM_CSP_ZERO 0x8000 /* Zero when deallocated or released */ -+#define SMCA_PERM_PSP_LOCK 0x4000 /* Part./pages can't be deallocated */ -+#define SMCA_PERM_PERM_LOCK 0x2000 /* Lock permissions */ -+#define SMCA_PERM_GRP_LOCK 0x1000 /* Lock access groups */ -+#define SMCA_PERM_RINGID_SHIFT 10 -+#define SMCA_PERM_RINGID_MASK (3 << SMCA_PERM_RINGID_SHIFT) -+#define SMCA_PERM_G2_BLOB 0x0080 /* Group 2 blob import/export */ -+#define SMCA_PERM_G2_WRITE 0x0020 /* Group 2 write */ -+#define SMCA_PERM_G2_READ 0x0010 /* Group 2 read */ -+#define SMCA_PERM_G1_BLOB 0x0008 /* Group 1... */ -+#define SMCA_PERM_G1_WRITE 0x0002 -+#define SMCA_PERM_G1_READ 0x0001 -+ - /* - * caam_assurance - Assurance Controller View - * base + 0x6000 padded out to 0x1000 -@@ -746,7 +887,6 @@ - u32 jr_ctl_hi; /* CxJRR - JobR Control Register @800 */ - u32 jr_ctl_lo; - u64 jr_descaddr; /* CxDADR - JobR Descriptor Address */ --#define DECO_OP_STATUS_HI_ERR_MASK 0xF00000FF - u32 op_status_hi; /* DxOPSTA - DECO Operation Status */ - u32 op_status_lo; - u32 rsvd24[2]; -@@ -760,21 +900,36 @@ - struct deco_sg_table sctr_tbl[4]; /* DxSTR - Scatter Tables */ - u32 rsvd29[48]; - u32 descbuf[64]; /* DxDESB - Descriptor buffer */ -- u32 rscvd30[193]; --#define DESC_DBG_DECO_STAT_HOST_ERR 0x00D00000 --#define DESC_DBG_DECO_STAT_VALID 0x80000000 --#define DESC_DBG_DECO_STAT_MASK 0x00F00000 -- u32 desc_dbg; /* DxDDR - DECO Debug Register */ -- u32 rsvd31[126]; --}; -- --#define DECO_JQCR_WHL 0x20000000 --#define DECO_JQCR_FOUR 0x10000000 -- --#define JR_BLOCK_NUMBER 1 --#define ASSURE_BLOCK_NUMBER 6 --#define QI_BLOCK_NUMBER 7 --#define DECO_BLOCK_NUMBER 8 --#define PG_SIZE_4K 0x1000 --#define PG_SIZE_64K 0x10000 -+ u32 rsvd30[320]; -+}; -+ -+/* -+ * Current top-level view of memory map is: -+ * -+ * 0x0000 - 0x0fff - CAAM Top-Level Control -+ * 0x1000 - 0x1fff - Job Ring 0 -+ * 0x2000 - 0x2fff - Job Ring 1 -+ * 0x3000 - 0x3fff - Job Ring 2 -+ * 0x4000 - 0x4fff - Job Ring 3 -+ * 0x5000 - 0x5fff - (unused) -+ * 0x6000 - 0x6fff - Assurance Controller -+ * 0x7000 - 0x7fff - Queue Interface -+ * 0x8000 - 0x8fff - DECO-CCB 0 -+ * 0x9000 - 0x9fff - DECO-CCB 1 -+ * 0xa000 - 0xafff - DECO-CCB 2 -+ * 0xb000 - 0xbfff - DECO-CCB 3 -+ * 0xc000 - 0xcfff - DECO-CCB 4 -+ * -+ * caam_full describes the full register view of CAAM if useful, -+ * although many configurations may choose to implement parts of -+ * the register map separately, in differing 
privilege regions -+ */ -+struct caam_full { -+ struct caam_ctrl __iomem ctrl; -+ struct caam_job_ring jr[4]; -+ u64 rsvd[512]; -+ struct caam_assurance assure; -+ struct caam_queue_if qi; -+}; -+ - #endif /* REGS_H */ -diff -Nur linux-4.1.3/drivers/crypto/caam/secvio.c linux-xbian-imx6/drivers/crypto/caam/secvio.c ---- linux-4.1.3/drivers/crypto/caam/secvio.c 1970-01-01 01:00:00.000000000 +0100 -+++ linux-xbian-imx6/drivers/crypto/caam/secvio.c 2015-07-27 23:13:04.213947410 +0200 -@@ -0,0 +1,290 @@ -+ -+/* -+ * SNVS Security Violation Handler -+ * Copyright (C) 2012-2015 Freescale Semiconductor, Inc., All Rights Reserved -+ */ -+ -+#include "compat.h" -+#include "intern.h" -+#include "secvio.h" -+#include "regs.h" -+ -+/* -+ * These names are associated with each violation handler. -+ * The source names were taken from MX6, and are based on recommendations -+ * for most common SoCs. -+ */ -+static const u8 *violation_src_name[] = { -+ "CAAM Internal Security Violation", -+ "JTAG Alarm", -+ "Watchdog", -+ "(reserved)", -+ "External Boot", -+ "External Tamper Detect", -+}; -+ -+/* These names help describe security monitor state for the console */ -+static const u8 *snvs_ssm_state_name[] = { -+ "init", -+ "hard fail", -+ "(undef:2)", -+ "soft fail", -+ "(undef:4)", -+ "(undef:5)", -+ "(undef:6)", -+ "(undef:7)", -+ "transition", -+ "check", -+ "(undef:10)", -+ "non-secure", -+ "(undef:12)", -+ "trusted", -+ "(undef:14)", -+ "secure", -+}; -+ -+/* Top-level security violation interrupt */ -+static irqreturn_t snvs_secvio_interrupt(int irq, void *snvsdev) -+{ -+ struct device *dev = snvsdev; -+ struct snvs_secvio_drv_private *svpriv = dev_get_drvdata(dev); -+ -+ /* Check the HP secvio status register */ -+ svpriv->irqcause = rd_reg32(&svpriv->svregs->hp.secvio_status) & -+ HP_SECVIOST_SECVIOMASK; -+ -+ if (!svpriv->irqcause) -+ return IRQ_NONE; -+ -+ /* Now ACK cause */ -+ setbits32(&svpriv->svregs->hp.secvio_status, svpriv->irqcause); -+ -+ /* And run deferred service */ -+ preempt_disable(); -+ tasklet_schedule(&svpriv->irqtask[smp_processor_id()]); -+ preempt_enable(); -+ -+ return IRQ_HANDLED; -+} -+ -+/* Deferred service handler. Tasklet arg is simply the SNVS dev */ -+static void snvs_secvio_dispatch(unsigned long indev) -+{ -+ struct device *dev = (struct device *)indev; -+ struct snvs_secvio_drv_private *svpriv = dev_get_drvdata(dev); -+ unsigned long flags; -+ int i; -+ -+ -+ /* Look through stored causes, call each handler if exists */ -+ for (i = 0; i < MAX_SECVIO_SOURCES; i++) -+ if (svpriv->irqcause & (1 << i)) { -+ spin_lock_irqsave(&svpriv->svlock, flags); -+ svpriv->intsrc[i].handler(dev, i, -+ svpriv->intsrc[i].ext); -+ spin_unlock_irqrestore(&svpriv->svlock, flags); -+ }; -+ -+ /* Re-enable now-serviced interrupts */ -+ setbits32(&svpriv->svregs->hp.secvio_intcfg, svpriv->irqcause); -+} -+ -+/* -+ * Default cause handler, used in lieu of an application-defined handler. -+ * All it does at this time is print a console message. It could force a halt. 
-+ */ -+static void snvs_secvio_default(struct device *dev, u32 cause, void *ext) -+{ -+ struct snvs_secvio_drv_private *svpriv = dev_get_drvdata(dev); -+ -+ dev_err(dev, "Unhandled Security Violation Interrupt %d = %s\n", -+ cause, svpriv->intsrc[cause].intname); -+} -+ -+/* -+ * Install an application-defined handler for a specified cause -+ * Arguments: -+ * - dev points to SNVS-owning device -+ * - cause interrupt source cause -+ * - handler application-defined handler, gets called with dev -+ * source cause, and locally-defined handler argument -+ * - cause_description points to a string to override the default cause -+ * name, this can be used as an alternate for error -+ * messages and such. If left NULL, the default -+ * description string is used. -+ * - ext pointer to any extra data needed by the handler. -+ */ -+int snvs_secvio_install_handler(struct device *dev, enum secvio_cause cause, -+ void (*handler)(struct device *dev, u32 cause, -+ void *ext), -+ u8 *cause_description, void *ext) -+{ -+ unsigned long flags; -+ struct snvs_secvio_drv_private *svpriv; -+ -+ svpriv = dev_get_drvdata(dev); -+ -+ if ((handler == NULL) || (cause > SECVIO_CAUSE_SOURCE_5)) -+ return -EINVAL; -+ -+ spin_lock_irqsave(&svpriv->svlock, flags); -+ svpriv->intsrc[cause].handler = handler; -+ if (cause_description != NULL) -+ svpriv->intsrc[cause].intname = cause_description; -+ if (ext != NULL) -+ svpriv->intsrc[cause].ext = ext; -+ spin_unlock_irqrestore(&svpriv->svlock, flags); -+ -+ return 0; -+} -+EXPORT_SYMBOL(snvs_secvio_install_handler); -+ -+/* -+ * Remove an application-defined handler for a specified cause (and, by -+ * implication, restore the "default". -+ * Arguments: -+ * - dev points to SNVS-owning device -+ * - cause interrupt source cause -+ */ -+int snvs_secvio_remove_handler(struct device *dev, enum secvio_cause cause) -+{ -+ unsigned long flags; -+ struct snvs_secvio_drv_private *svpriv; -+ -+ svpriv = dev_get_drvdata(dev); -+ -+ if (cause > SECVIO_CAUSE_SOURCE_5) -+ return -EINVAL; -+ -+ spin_lock_irqsave(&svpriv->svlock, flags); -+ svpriv->intsrc[cause].intname = violation_src_name[cause]; -+ svpriv->intsrc[cause].handler = snvs_secvio_default; -+ svpriv->intsrc[cause].ext = NULL; -+ spin_unlock_irqrestore(&svpriv->svlock, flags); -+ return 0; -+} -+EXPORT_SYMBOL(snvs_secvio_remove_handler); -+ -+static int snvs_secvio_remove(struct platform_device *pdev) -+{ -+ struct device *svdev; -+ struct snvs_secvio_drv_private *svpriv; -+ int i; -+ -+ svdev = &pdev->dev; -+ svpriv = dev_get_drvdata(svdev); -+ -+ /* Set all sources to nonfatal */ -+ wr_reg32(&svpriv->svregs->hp.secvio_intcfg, 0); -+ -+ /* Remove tasklets and release interrupt */ -+ for_each_possible_cpu(i) -+ tasklet_kill(&svpriv->irqtask[i]); -+ -+ free_irq(svpriv->irq, svdev); -+ iounmap(svpriv->svregs); -+ kfree(svpriv); -+ -+ return 0; -+} -+ -+static int snvs_secvio_probe(struct platform_device *pdev) -+{ -+ struct device *svdev; -+ struct snvs_secvio_drv_private *svpriv; -+ struct device_node *np, *npirq; -+ struct snvs_full __iomem *snvsregs; -+ int i, error; -+ u32 hpstate; -+ -+ svpriv = kzalloc(sizeof(struct snvs_secvio_drv_private), GFP_KERNEL); -+ if (!svpriv) -+ return -ENOMEM; -+ -+ svdev = &pdev->dev; -+ dev_set_drvdata(svdev, svpriv); -+ svpriv->pdev = pdev; -+ np = pdev->dev.of_node; -+ -+ npirq = of_find_compatible_node(NULL, NULL, "fsl,imx6q-caam-secvio"); -+ if (!npirq) { -+ dev_err(svdev, "can't identify secvio interrupt\n"); -+ kfree(svpriv); -+ return -EINVAL; -+ } -+ svpriv->irq = 
irq_of_parse_and_map(npirq, 0); -+ if (svpriv->irq <= 0) { -+ kfree(svpriv); -+ return -EINVAL; -+ } -+ -+ snvsregs = of_iomap(np, 0); -+ if (!snvsregs) { -+ dev_err(svdev, "register mapping failed\n"); -+ return -ENOMEM; -+ } -+ svpriv->svregs = (struct snvs_full __force *)snvsregs; -+ -+ /* Device data set up. Now init interrupt source descriptions */ -+ for (i = 0; i < MAX_SECVIO_SOURCES; i++) { -+ svpriv->intsrc[i].intname = violation_src_name[i]; -+ svpriv->intsrc[i].handler = snvs_secvio_default; -+ } -+ /* Connect main handler */ -+ for_each_possible_cpu(i) -+ tasklet_init(&svpriv->irqtask[i], snvs_secvio_dispatch, -+ (unsigned long)svdev); -+ -+ error = request_irq(svpriv->irq, snvs_secvio_interrupt, -+ IRQF_SHARED, "snvs-secvio", svdev); -+ if (error) { -+ dev_err(svdev, "can't connect secvio interrupt\n"); -+ irq_dispose_mapping(svpriv->irq); -+ svpriv->irq = 0; -+ iounmap(svpriv->svregs); -+ kfree(svpriv); -+ return -EINVAL; -+ } -+ -+ /* -+ * Configure all sources as fatal violations except LP section, -+ * source #5 (typically used as an external tamper detect), and -+ * source #3 (typically unused). Whenever the transition to -+ * secure mode has occurred, these will now be "fatal" violations -+ */ -+ wr_reg32(&svpriv->svregs->hp.secvio_intcfg, -+ HP_SECVIO_INTEN_SRC4 | HP_SECVIO_INTEN_SRC2 | -+ HP_SECVIO_INTEN_SRC1 | HP_SECVIO_INTEN_SRC0); -+ -+ hpstate = (rd_reg32(&svpriv->svregs->hp.status) & -+ HP_STATUS_SSM_ST_MASK) >> HP_STATUS_SSM_ST_SHIFT; -+ dev_info(svdev, "violation handlers armed - %s state\n", -+ snvs_ssm_state_name[hpstate]); -+ -+ return 0; -+} -+ -+static struct of_device_id snvs_secvio_match[] = { -+ { -+ .compatible = "fsl,imx6q-caam-snvs", -+ }, -+ {}, -+}; -+MODULE_DEVICE_TABLE(of, snvs_secvio_match); -+ -+static struct platform_driver snvs_secvio_driver = { -+ .driver = { -+ .name = "snvs-secvio", -+ .owner = THIS_MODULE, -+ .of_match_table = snvs_secvio_match, -+ }, -+ .probe = snvs_secvio_probe, -+ .remove = snvs_secvio_remove, -+}; -+ -+module_platform_driver(snvs_secvio_driver); -+ -+MODULE_LICENSE("Dual BSD/GPL"); -+MODULE_DESCRIPTION("FSL SNVS Security Violation Handler"); -+MODULE_AUTHOR("Freescale Semiconductor - MCU"); -+ -diff -Nur linux-4.1.3/drivers/crypto/caam/secvio.h linux-xbian-imx6/drivers/crypto/caam/secvio.h ---- linux-4.1.3/drivers/crypto/caam/secvio.h 1970-01-01 01:00:00.000000000 +0100 -+++ linux-xbian-imx6/drivers/crypto/caam/secvio.h 2015-07-27 23:13:04.213947410 +0200 -@@ -0,0 +1,66 @@ -+ -+/* -+ * CAAM Security Violation Handler -+ * Copyright (C) 2012-2014 Freescale Semiconductor, Inc., All Rights Reserved -+ */ -+ -+#ifndef SECVIO_H -+#define SECVIO_H -+ -+#include "snvsregs.h" -+ -+ -+/* -+ * Defines the published interfaces to install/remove application-specified -+ * handlers for catching violations -+ */ -+ -+#define MAX_SECVIO_SOURCES 6 -+ -+/* these are the untranslated causes */ -+enum secvio_cause { -+ SECVIO_CAUSE_SOURCE_0, -+ SECVIO_CAUSE_SOURCE_1, -+ SECVIO_CAUSE_SOURCE_2, -+ SECVIO_CAUSE_SOURCE_3, -+ SECVIO_CAUSE_SOURCE_4, -+ SECVIO_CAUSE_SOURCE_5 -+}; -+ -+/* These are common "recommended" cause definitions for most devices */ -+#define SECVIO_CAUSE_CAAM_VIOLATION SECVIO_CAUSE_SOURCE_0 -+#define SECVIO_CAUSE_JTAG_ALARM SECVIO_CAUSE_SOURCE_1 -+#define SECVIO_CAUSE_WATCHDOG SECVIO_CAUSE_SOURCE_2 -+#define SECVIO_CAUSE_EXTERNAL_BOOT SECVIO_CAUSE_SOURCE_4 -+#define SECVIO_CAUSE_TAMPER_DETECT SECVIO_CAUSE_SOURCE_5 -+ -+int snvs_secvio_install_handler(struct device *dev, enum secvio_cause cause, -+ void (*handler)(struct 
device *dev, u32 cause, -+ void *ext), -+ u8 *cause_description, void *ext); -+int snvs_secvio_remove_handler(struct device *dev, enum secvio_cause cause); -+ -+/* -+ * Private data definitions for the secvio "driver" -+ */ -+ -+struct secvio_int_src { -+ const u8 *intname; /* Points to a descriptive name for source */ -+ void *ext; /* Extended data to pass to the handler */ -+ void (*handler)(struct device *dev, u32 cause, void *ext); -+}; -+ -+struct snvs_secvio_drv_private { -+ struct platform_device *pdev; -+ spinlock_t svlock ____cacheline_aligned; -+ struct tasklet_struct irqtask[NR_CPUS]; -+ struct snvs_full __iomem *svregs; /* both HP and LP domains */ -+ int irq; -+ u32 irqcause; /* stashed cause of violation interrupt */ -+ -+ /* Registered handlers for each violation */ -+ struct secvio_int_src intsrc[MAX_SECVIO_SOURCES]; -+ -+}; -+ -+#endif /* SECVIO_H */ -diff -Nur linux-4.1.3/drivers/crypto/caam/sg_sw_sec4.h linux-xbian-imx6/drivers/crypto/caam/sg_sw_sec4.h ---- linux-4.1.3/drivers/crypto/caam/sg_sw_sec4.h 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/drivers/crypto/caam/sg_sw_sec4.h 2015-07-27 23:13:04.213947410 +0200 -@@ -1,7 +1,7 @@ - /* - * CAAM/SEC 4.x functions for using scatterlists in caam driver - * -- * Copyright 2008-2011 Freescale Semiconductor, Inc. -+ * Copyright (C) 2008-2013 Freescale Semiconductor, Inc. - * - */ - -@@ -91,13 +91,22 @@ - { - if (unlikely(chained)) { - int i; -+ struct scatterlist *tsg = sg; -+ -+ /* We use a local copy of the sg pointer to avoid moving the -+ * head of the list pointed to by sg as we wall the list. -+ */ - for (i = 0; i < nents; i++) { -- dma_map_sg(dev, sg, 1, dir); -- sg = sg_next(sg); -+ dma_map_sg(dev, tsg, 1, dir); -+ tsg = sg_next(tsg); - } - } else { - dma_map_sg(dev, sg, nents, dir); - } -+ -+ if ((dir == DMA_TO_DEVICE) || (dir == DMA_BIDIRECTIONAL)) -+ dma_sync_sg_for_device(dev, sg, nents, dir); -+ - return nents; - } - -@@ -105,6 +114,9 @@ - unsigned int nents, enum dma_data_direction dir, - bool chained) - { -+ if ((dir == DMA_FROM_DEVICE) || (dir == DMA_BIDIRECTIONAL)) -+ dma_sync_sg_for_cpu(dev, sg, nents, dir); -+ - if (unlikely(chained)) { - int i; - for (i = 0; i < nents; i++) { -@@ -116,3 +128,41 @@ - } - return nents; - } -+ -+/* Copy from len bytes of sg to dest, starting from beginning */ -+static inline void sg_copy(u8 *dest, struct scatterlist *sg, unsigned int len) -+{ -+ struct scatterlist *current_sg = sg; -+ int cpy_index = 0, next_cpy_index = current_sg->length; -+ -+ while (next_cpy_index < len) { -+ memcpy(dest + cpy_index, (u8 *) sg_virt(current_sg), -+ current_sg->length); -+ current_sg = sg_next(current_sg); -+ cpy_index = next_cpy_index; -+ next_cpy_index += current_sg->length; -+ } -+ if (cpy_index < len) -+ memcpy(dest + cpy_index, (u8 *) sg_virt(current_sg), -+ len - cpy_index); -+} -+ -+/* Copy sg data, from to_skip to end, to dest */ -+static inline void sg_copy_part(u8 *dest, struct scatterlist *sg, -+ int to_skip, unsigned int end) -+{ -+ struct scatterlist *current_sg = sg; -+ int sg_index, cpy_index; -+ -+ sg_index = current_sg->length; -+ while (sg_index <= to_skip) { -+ current_sg = sg_next(current_sg); -+ sg_index += current_sg->length; -+ } -+ cpy_index = sg_index - to_skip; -+ memcpy(dest, (u8 *) sg_virt(current_sg) + -+ current_sg->length - cpy_index, cpy_index); -+ current_sg = sg_next(current_sg); -+ if (end - sg_index) -+ sg_copy(dest + cpy_index, current_sg, end - sg_index); -+} -diff -Nur linux-4.1.3/drivers/crypto/caam/sm.h 
linux-xbian-imx6/drivers/crypto/caam/sm.h ---- linux-4.1.3/drivers/crypto/caam/sm.h 1970-01-01 01:00:00.000000000 +0100 -+++ linux-xbian-imx6/drivers/crypto/caam/sm.h 2015-07-27 23:13:04.213947410 +0200 -@@ -0,0 +1,88 @@ -+ -+/* -+ * CAAM Secure Memory/Keywrap API Definitions -+ * Copyright (C) 2008-2013 Freescale Semiconductor, Inc. -+ */ -+ -+#ifndef SM_H -+#define SM_H -+ -+ -+/* Storage access permissions */ -+#define SM_PERM_READ 0x01 -+#define SM_PERM_WRITE 0x02 -+#define SM_PERM_BLOB 0x03 -+ -+ -+/* Keystore maintenance functions */ -+void sm_init_keystore(struct device *dev); -+u32 sm_detect_keystore_units(struct device *dev); -+int sm_establish_keystore(struct device *dev, u32 unit); -+void sm_release_keystore(struct device *dev, u32 unit); -+void caam_sm_shutdown(struct platform_device *pdev); -+int caam_sm_example_init(struct platform_device *pdev); -+ -+/* Keystore accessor functions */ -+extern int sm_keystore_slot_alloc(struct device *dev, u32 unit, u32 size, -+ u32 *slot); -+extern int sm_keystore_slot_dealloc(struct device *dev, u32 unit, u32 slot); -+extern int sm_keystore_slot_load(struct device *dev, u32 unit, u32 slot, -+ const u8 *key_data, u32 key_length); -+extern int sm_keystore_slot_read(struct device *dev, u32 unit, u32 slot, -+ u32 key_length, u8 *key_data); -+extern int sm_keystore_slot_encapsulate(struct device *dev, u32 unit, -+ u32 inslot, u32 outslot, u16 secretlen, -+ u8 *keymod, u16 keymodlen); -+extern int sm_keystore_slot_decapsulate(struct device *dev, u32 unit, -+ u32 inslot, u32 outslot, u16 secretlen, -+ u8 *keymod, u16 keymodlen); -+ -+/* Data structure to hold per-slot information */ -+struct keystore_data_slot_info { -+ u8 allocated; /* Track slot assignments */ -+ u32 key_length; /* Size of the key */ -+}; -+ -+/* Data structure to hold keystore information */ -+struct keystore_data { -+ void *base_address; /* Base of the Secure Partition */ -+ u32 slot_count; /* Number of slots in the keystore */ -+ struct keystore_data_slot_info *slot; /* Per-slot information */ -+}; -+ -+/* store the detected attributes of a secure memory page */ -+struct sm_page_descriptor { -+ u16 phys_pagenum; /* may be discontiguous */ -+ u16 own_part; /* Owning partition */ -+ void *pg_base; /* Calculated virtual address */ -+ struct keystore_data *ksdata; -+}; -+ -+struct caam_drv_private_sm { -+ struct device *parentdev; /* this ends up as the controller */ -+ struct device *smringdev; /* ring that owns this instance */ -+ spinlock_t kslock ____cacheline_aligned; -+ -+ /* Default parameters for geometry */ -+ u32 max_pages; /* maximum pages this instance can support */ -+ u32 top_partition; /* highest partition number in this instance */ -+ u32 top_page; /* highest page number in this instance */ -+ u32 page_size; /* page size */ -+ u32 slot_size; /* selected size of each storage block */ -+ -+ /* Partition/Page Allocation Map */ -+ u32 localpages; /* Number of pages we can access */ -+ struct sm_page_descriptor *pagedesc; /* Allocated per-page */ -+ -+ /* Installed handlers for keystore access */ -+ int (*data_init)(struct device *dev, u32 unit); -+ void (*data_cleanup)(struct device *dev, u32 unit); -+ int (*slot_alloc)(struct device *dev, u32 unit, u32 size, u32 *slot); -+ int (*slot_dealloc)(struct device *dev, u32 unit, u32 slot); -+ void *(*slot_get_address)(struct device *dev, u32 unit, u32 handle); -+ u32 (*slot_get_base)(struct device *dev, u32 unit, u32 handle); -+ u32 (*slot_get_offset)(struct device *dev, u32 unit, u32 handle); -+ u32 
(*slot_get_slot_size)(struct device *dev, u32 unit, u32 handle); -+}; -+ -+#endif /* SM_H */ -diff -Nur linux-4.1.3/drivers/crypto/caam/sm_store.c linux-xbian-imx6/drivers/crypto/caam/sm_store.c ---- linux-4.1.3/drivers/crypto/caam/sm_store.c 1970-01-01 01:00:00.000000000 +0100 -+++ linux-xbian-imx6/drivers/crypto/caam/sm_store.c 2015-07-27 23:13:04.213947410 +0200 -@@ -0,0 +1,896 @@ -+ -+/* -+ * CAAM Secure Memory Storage Interface -+ * Copyright (C) 2008-2013 Freescale Semiconductor, Inc. -+ * -+ * Loosely based on the SHW Keystore API for SCC/SCC2 -+ * Experimental implementation and NOT intended for upstream use. Expect -+ * this interface to be amended significantly in the future once it becomes -+ * integrated into live applications. -+ * -+ * Known issues: -+ * -+ * - Executes one instance of an secure memory "driver". This is tied to the -+ * fact that job rings can't run as standalone instances in the present -+ * configuration. -+ * -+ * - It does not expose a userspace interface. The value of a userspace -+ * interface for access to secrets is a point for further architectural -+ * discussion. -+ * -+ * - Partition/permission management is not part of this interface. It -+ * depends on some level of "knowledge" agreed upon between bootloader, -+ * provisioning applications, and OS-hosted software (which uses this -+ * driver). -+ * -+ * - No means of identifying the location or purpose of secrets managed by -+ * this interface exists; "slot location" and format of a given secret -+ * needs to be agreed upon between bootloader, provisioner, and OS-hosted -+ * application. -+ */ -+ -+#include "compat.h" -+#include "regs.h" -+#include "jr.h" -+#include "desc.h" -+#include "intern.h" -+#include "error.h" -+#include "sm.h" -+ -+#ifdef SM_DEBUG_CONT -+void sm_show_page(struct device *dev, struct sm_page_descriptor *pgdesc) -+{ -+ struct caam_drv_private_sm *smpriv = dev_get_drvdata(dev); -+ u32 i, *smdata; -+ -+ dev_info(dev, "physical page %d content at 0x%08x\n", -+ pgdesc->phys_pagenum, pgdesc->pg_base); -+ smdata = pgdesc->pg_base; -+ for (i = 0; i < (smpriv->page_size / sizeof(u32)); i += 4) -+ dev_info(dev, "[0x%08x] 0x%08x 0x%08x 0x%08x 0x%08x\n", -+ (u32)&smdata[i], smdata[i], smdata[i+1], smdata[i+2], -+ smdata[i+3]); -+} -+#endif -+ -+/* -+ * Construct a secure memory blob encapsulation job descriptor -+ * -+ * - desc pointer to hold new (to be allocated) pointer to the generated -+ * descriptor for later use. Calling thread can kfree the -+ * descriptor after execution. -+ * - keymod Physical pointer to key modifier (contiguous piece). -+ * - keymodsz Size of key modifier in bytes (should normally be 8). -+ * - secretbuf Physical pointer (within an accessible secure memory page) -+ * of the secret to be encapsulated. -+ * - outbuf Physical pointer (within an accessible secure memory page) -+ * of the encapsulated output. This will be larger than the -+ * input secret because of the added encapsulation data. -+ * - secretsz Size of input secret, in bytes. -+ * - auth If nonzero, use AES-CCM for encapsulation, else use ECB -+ * -+ * Note: this uses 32-bit pointers at present -+ */ -+#define INITIAL_DESCSZ 16 /* size of tmp buffer for descriptor const. 
*/ -+static int blob_encap_desc(u32 **desc, dma_addr_t keymod, u16 keymodsz, -+ dma_addr_t secretbuf, dma_addr_t outbuf, -+ u16 secretsz, bool auth) -+{ -+ u32 *tdesc, tmpdesc[INITIAL_DESCSZ]; -+ u16 dsize, idx; -+ -+ memset(tmpdesc, 0, INITIAL_DESCSZ * sizeof(u32)); -+ idx = 1; -+ -+ /* Load key modifier */ -+ tmpdesc[idx++] = CMD_LOAD | LDST_CLASS_2_CCB | LDST_SRCDST_BYTE_KEY | -+ ((12 << LDST_OFFSET_SHIFT) & LDST_OFFSET_MASK) | -+ (keymodsz & LDST_LEN_MASK); -+ -+ tmpdesc[idx++] = (u32)keymod; -+ -+ /* Encapsulate to secure memory */ -+ tmpdesc[idx++] = CMD_SEQ_IN_PTR | secretsz; -+ tmpdesc[idx++] = (u32)secretbuf; -+ -+ /* Add space for BKEK and MAC tag */ -+ tmpdesc[idx++] = CMD_SEQ_IN_PTR | (secretsz + (32 + 16)); -+ -+ tmpdesc[idx++] = (u32)outbuf; -+ tmpdesc[idx] = CMD_OPERATION | OP_TYPE_ENCAP_PROTOCOL | OP_PCLID_BLOB | -+ OP_PCL_BLOB_PTXT_SECMEM; -+ if (auth) -+ tmpdesc[idx] |= OP_PCL_BLOB_EKT; -+ -+ idx++; -+ tmpdesc[0] = CMD_DESC_HDR | HDR_ONE | (idx & HDR_DESCLEN_MASK); -+ dsize = idx * sizeof(u32); -+ -+ tdesc = kmalloc(dsize, GFP_KERNEL | GFP_DMA); -+ if (tdesc == NULL) -+ return 0; -+ -+ memcpy(tdesc, tmpdesc, dsize); -+ *desc = tdesc; -+ return dsize; -+} -+ -+/* -+ * Construct a secure memory blob decapsulation job descriptor -+ * -+ * - desc pointer to hold new (to be allocated) pointer to the generated -+ * descriptor for later use. Calling thread can kfree the -+ * descriptor after execution. -+ * - keymod Physical pointer to key modifier (contiguous piece). -+ * - keymodsz Size of key modifier in bytes (should normally be 16). -+ * - blobbuf Physical pointer (within an accessible secure memory page) -+ * of the blob to be decapsulated. -+ * - outbuf Physical pointer (within an accessible secure memory page) -+ * of the decapsulated output. -+ * - secretsz Size of input blob, in bytes. 
-+ * - auth If nonzero, assume AES-CCM for decapsulation, else use ECB -+ * -+ * Note: this uses 32-bit pointers at present -+ */ -+static int blob_decap_desc(u32 **desc, dma_addr_t keymod, u16 keymodsz, -+ dma_addr_t blobbuf, dma_addr_t outbuf, -+ u16 blobsz, bool auth) -+{ -+ u32 *tdesc, tmpdesc[INITIAL_DESCSZ]; -+ u16 dsize, idx; -+ -+ memset(tmpdesc, 0, INITIAL_DESCSZ * sizeof(u32)); -+ idx = 1; -+ -+ /* Load key modifier */ -+ tmpdesc[idx++] = CMD_LOAD | LDST_CLASS_2_CCB | LDST_SRCDST_BYTE_KEY | -+ ((12 << LDST_OFFSET_SHIFT) & LDST_OFFSET_MASK) | -+ (keymodsz & LDST_LEN_MASK); -+ -+ tmpdesc[idx++] = (u32)keymod; -+ -+ /* Compensate BKEK + MAC tag */ -+ tmpdesc[idx++] = CMD_SEQ_IN_PTR | (blobsz + 32 + 16); -+ -+ tmpdesc[idx++] = (u32)blobbuf; -+ tmpdesc[idx++] = CMD_SEQ_OUT_PTR | blobsz; -+ tmpdesc[idx++] = (u32)outbuf; -+ -+ /* Decapsulate from secure memory partition to black blob */ -+ tmpdesc[idx] = CMD_OPERATION | OP_TYPE_DECAP_PROTOCOL | OP_PCLID_BLOB | -+ OP_PCL_BLOB_PTXT_SECMEM | OP_PCL_BLOB_BLACK; -+ if (auth) -+ tmpdesc[idx] |= OP_PCL_BLOB_EKT; -+ -+ idx++; -+ tmpdesc[0] = CMD_DESC_HDR | HDR_ONE | (idx & HDR_DESCLEN_MASK); -+ dsize = idx * sizeof(u32); -+ -+ tdesc = kmalloc(dsize, GFP_KERNEL | GFP_DMA); -+ if (tdesc == NULL) -+ return 0; -+ -+ memcpy(tdesc, tmpdesc, dsize); -+ *desc = tdesc; -+ return dsize; -+} -+ -+/* -+ * Pseudo-synchronous ring access functions for carrying out key -+ * encapsulation and decapsulation -+ */ -+ -+struct sm_key_job_result { -+ int error; -+ struct completion completion; -+}; -+ -+void sm_key_job_done(struct device *dev, u32 *desc, u32 err, void *context) -+{ -+ struct sm_key_job_result *res = context; -+ -+ res->error = err; /* save off the error for postprocessing */ -+ complete(&res->completion); /* mark us complete */ -+} -+ -+static int sm_key_job(struct device *ksdev, u32 *jobdesc) -+{ -+ struct sm_key_job_result testres; -+ struct caam_drv_private_sm *kspriv; -+ int rtn = 0; -+ -+ kspriv = dev_get_drvdata(ksdev); -+ -+ init_completion(&testres.completion); -+ -+ rtn = caam_jr_enqueue(kspriv->smringdev, jobdesc, sm_key_job_done, -+ &testres); -+ if (!rtn) { -+ wait_for_completion_interruptible(&testres.completion); -+ rtn = testres.error; -+ } -+ return rtn; -+} -+ -+/* -+ * Following section establishes the default methods for keystore access -+ * They are NOT intended for use external to this module -+ * -+ * In the present version, these are the only means for the higher-level -+ * interface to deal with the mechanics of accessing the phyiscal keystore -+ */ -+ -+ -+int slot_alloc(struct device *dev, u32 unit, u32 size, u32 *slot) -+{ -+ struct caam_drv_private_sm *smpriv = dev_get_drvdata(dev); -+ struct keystore_data *ksdata = smpriv->pagedesc[unit].ksdata; -+ u32 i; -+#ifdef SM_DEBUG -+ dev_info(dev, "slot_alloc(): requesting slot for %d bytes\n", size); -+#endif -+ -+ if (size > smpriv->slot_size) -+ return -EKEYREJECTED; -+ -+ for (i = 0; i < ksdata->slot_count; i++) { -+ if (ksdata->slot[i].allocated == 0) { -+ ksdata->slot[i].allocated = 1; -+ (*slot) = i; -+#ifdef SM_DEBUG -+ dev_info(dev, "slot_alloc(): new slot %d allocated\n", -+ *slot); -+#endif -+ return 0; -+ } -+ } -+ -+ return -ENOSPC; -+} -+EXPORT_SYMBOL(slot_alloc); -+ -+int slot_dealloc(struct device *dev, u32 unit, u32 slot) -+{ -+ struct caam_drv_private_sm *smpriv = dev_get_drvdata(dev); -+ struct keystore_data *ksdata = smpriv->pagedesc[unit].ksdata; -+ u8 __iomem *slotdata; -+ -+#ifdef SM_DEBUG -+ dev_info(dev, "slot_dealloc(): releasing slot %d\n", slot); 
-+#endif -+ if (slot >= ksdata->slot_count) -+ return -EINVAL; -+ slotdata = ksdata->base_address + slot * smpriv->slot_size; -+ -+ if (ksdata->slot[slot].allocated == 1) { -+ /* Forcibly overwrite the data from the keystore */ -+ memset(ksdata->base_address + slot * smpriv->slot_size, 0, -+ smpriv->slot_size); -+ -+ ksdata->slot[slot].allocated = 0; -+#ifdef SM_DEBUG -+ dev_info(dev, "slot_dealloc(): slot %d released\n", slot); -+#endif -+ return 0; -+ } -+ -+ return -EINVAL; -+} -+EXPORT_SYMBOL(slot_dealloc); -+ -+void *slot_get_address(struct device *dev, u32 unit, u32 slot) -+{ -+ struct caam_drv_private_sm *smpriv = dev_get_drvdata(dev); -+ struct keystore_data *ksdata = smpriv->pagedesc[unit].ksdata; -+ -+ if (slot >= ksdata->slot_count) -+ return NULL; -+ -+#ifdef SM_DEBUG -+ dev_info(dev, "slot_get_address(): slot %d is 0x%08x\n", slot, -+ (u32)ksdata->base_address + slot * smpriv->slot_size); -+#endif -+ -+ return ksdata->base_address + slot * smpriv->slot_size; -+} -+ -+u32 slot_get_base(struct device *dev, u32 unit, u32 slot) -+{ -+ struct caam_drv_private_sm *smpriv = dev_get_drvdata(dev); -+ struct keystore_data *ksdata = smpriv->pagedesc[unit].ksdata; -+ -+ /* -+ * There could potentially be more than one secure partition object -+ * associated with this keystore. For now, there is just one. -+ */ -+ -+ (void)slot; -+ -+#ifdef SM_DEBUG -+ dev_info(dev, "slot_get_base(): slot %d = 0x%08x\n", -+ slot, (u32)ksdata->base_address); -+#endif -+ -+ return (u32)(ksdata->base_address); -+} -+ -+u32 slot_get_offset(struct device *dev, u32 unit, u32 slot) -+{ -+ struct caam_drv_private_sm *smpriv = dev_get_drvdata(dev); -+ struct keystore_data *ksdata = smpriv->pagedesc[unit].ksdata; -+ -+ if (slot >= ksdata->slot_count) -+ return -EINVAL; -+ -+#ifdef SM_DEBUG -+ dev_info(dev, "slot_get_offset(): slot %d = %d\n", slot, -+ slot * smpriv->slot_size); -+#endif -+ -+ return slot * smpriv->slot_size; -+} -+ -+u32 slot_get_slot_size(struct device *dev, u32 unit, u32 slot) -+{ -+ struct caam_drv_private_sm *smpriv = dev_get_drvdata(dev); -+ -+ -+#ifdef SM_DEBUG -+ dev_info(dev, "slot_get_slot_size(): slot %d = %d\n", slot, -+ smpriv->slot_size); -+#endif -+ /* All slots are the same size in the default implementation */ -+ return smpriv->slot_size; -+} -+ -+ -+ -+int kso_init_data(struct device *dev, u32 unit) -+{ -+ struct caam_drv_private_sm *smpriv = dev_get_drvdata(dev); -+ int retval = -EINVAL; -+ struct keystore_data *keystore_data = NULL; -+ u32 slot_count; -+ u32 keystore_data_size; -+ -+ /* -+ * Calculate the required size of the keystore data structure, based -+ * on the number of keys that can fit in the partition. -+ */ -+ slot_count = smpriv->page_size / smpriv->slot_size; -+#ifdef SM_DEBUG -+ dev_info(dev, "kso_init_data: %d slots initializing\n", slot_count); -+#endif -+ -+ keystore_data_size = sizeof(struct keystore_data) + -+ slot_count * -+ sizeof(struct keystore_data_slot_info); -+ -+ keystore_data = kzalloc(keystore_data_size, GFP_KERNEL); -+ -+ if (keystore_data == NULL) { -+ retval = -ENOSPC; -+ goto out; -+ } -+ -+#ifdef SM_DEBUG -+ dev_info(dev, "kso_init_data: keystore data size = %d\n", -+ keystore_data_size); -+#endif -+ -+ /* -+ * Place the slot information structure directly after the keystore data -+ * structure. 
-+ */ -+ keystore_data->slot = (struct keystore_data_slot_info *) -+ (keystore_data + 1); -+ keystore_data->slot_count = slot_count; -+ -+ smpriv->pagedesc[unit].ksdata = keystore_data; -+ smpriv->pagedesc[unit].ksdata->base_address = -+ smpriv->pagedesc[unit].pg_base; -+ -+ retval = 0; -+ -+out: -+ if (retval != 0) -+ if (keystore_data != NULL) -+ kfree(keystore_data); -+ -+ -+ return retval; -+} -+ -+void kso_cleanup_data(struct device *dev, u32 unit) -+{ -+ struct caam_drv_private_sm *smpriv = dev_get_drvdata(dev); -+ struct keystore_data *keystore_data = NULL; -+ -+ if (smpriv->pagedesc[unit].ksdata != NULL) -+ keystore_data = smpriv->pagedesc[unit].ksdata; -+ -+ /* Release the allocated keystore management data */ -+ kfree(smpriv->pagedesc[unit].ksdata); -+ -+ return; -+} -+ -+ -+ -+/* -+ * Keystore management section -+ */ -+ -+void sm_init_keystore(struct device *dev) -+{ -+ struct caam_drv_private_sm *smpriv = dev_get_drvdata(dev); -+ -+ smpriv->data_init = kso_init_data; -+ smpriv->data_cleanup = kso_cleanup_data; -+ smpriv->slot_alloc = slot_alloc; -+ smpriv->slot_dealloc = slot_dealloc; -+ smpriv->slot_get_address = slot_get_address; -+ smpriv->slot_get_base = slot_get_base; -+ smpriv->slot_get_offset = slot_get_offset; -+ smpriv->slot_get_slot_size = slot_get_slot_size; -+#ifdef SM_DEBUG -+ dev_info(dev, "sm_init_keystore(): handlers installed\n"); -+#endif -+} -+EXPORT_SYMBOL(sm_init_keystore); -+ -+/* Return available pages/units */ -+u32 sm_detect_keystore_units(struct device *dev) -+{ -+ struct caam_drv_private_sm *smpriv = dev_get_drvdata(dev); -+ -+ return smpriv->localpages; -+} -+EXPORT_SYMBOL(sm_detect_keystore_units); -+ -+/* -+ * Do any keystore specific initializations -+ */ -+int sm_establish_keystore(struct device *dev, u32 unit) -+{ -+ struct caam_drv_private_sm *smpriv = dev_get_drvdata(dev); -+ -+#ifdef SM_DEBUG -+ dev_info(dev, "sm_establish_keystore(): unit %d initializing\n", unit); -+#endif -+ -+ if (smpriv->data_init == NULL) -+ return -EINVAL; -+ -+ /* Call the data_init function for any user setup */ -+ return smpriv->data_init(dev, unit); -+} -+EXPORT_SYMBOL(sm_establish_keystore); -+ -+void sm_release_keystore(struct device *dev, u32 unit) -+{ -+ struct caam_drv_private_sm *smpriv = dev_get_drvdata(dev); -+ -+#ifdef SM_DEBUG -+ dev_info(dev, "sm_establish_keystore(): unit %d releasing\n", unit); -+#endif -+ if ((smpriv != NULL) && (smpriv->data_cleanup != NULL)) -+ smpriv->data_cleanup(dev, unit); -+ -+ return; -+} -+EXPORT_SYMBOL(sm_release_keystore); -+ -+/* -+ * Subsequent interfacce (sm_keystore_*) forms the accessor interfacce to -+ * the keystore -+ */ -+int sm_keystore_slot_alloc(struct device *dev, u32 unit, u32 size, u32 *slot) -+{ -+ struct caam_drv_private_sm *smpriv = dev_get_drvdata(dev); -+ int retval = -EINVAL; -+ -+ spin_lock(&smpriv->kslock); -+ -+ if ((smpriv->slot_alloc == NULL) || -+ (smpriv->pagedesc[unit].ksdata == NULL)) -+ goto out; -+ -+ retval = smpriv->slot_alloc(dev, unit, size, slot); -+ -+out: -+ spin_unlock(&smpriv->kslock); -+ return retval; -+} -+EXPORT_SYMBOL(sm_keystore_slot_alloc); -+ -+int sm_keystore_slot_dealloc(struct device *dev, u32 unit, u32 slot) -+{ -+ struct caam_drv_private_sm *smpriv = dev_get_drvdata(dev); -+ int retval = -EINVAL; -+ -+ spin_lock(&smpriv->kslock); -+ -+ if ((smpriv->slot_alloc == NULL) || -+ (smpriv->pagedesc[unit].ksdata == NULL)) -+ goto out; -+ -+ retval = smpriv->slot_dealloc(dev, unit, slot); -+out: -+ spin_unlock(&smpriv->kslock); -+ return retval; -+} 
-+EXPORT_SYMBOL(sm_keystore_slot_dealloc); -+ -+int sm_keystore_slot_load(struct device *dev, u32 unit, u32 slot, -+ const u8 *key_data, u32 key_length) -+{ -+ struct caam_drv_private_sm *smpriv = dev_get_drvdata(dev); -+ int retval = -EINVAL; -+ u32 slot_size; -+ u32 i; -+ u8 __iomem *slot_location; -+ -+ spin_lock(&smpriv->kslock); -+ -+ slot_size = smpriv->slot_get_slot_size(dev, unit, slot); -+ -+ if (key_length > slot_size) { -+ retval = -EFBIG; -+ goto out; -+ } -+ -+ slot_location = smpriv->slot_get_address(dev, unit, slot); -+ -+ for (i = 0; i < key_length; i++) -+ slot_location[i] = key_data[i]; -+ -+ retval = 0; -+ -+out: -+ spin_unlock(&smpriv->kslock); -+ return retval; -+} -+EXPORT_SYMBOL(sm_keystore_slot_load); -+ -+int sm_keystore_slot_read(struct device *dev, u32 unit, u32 slot, -+ u32 key_length, u8 *key_data) -+{ -+ struct caam_drv_private_sm *smpriv = dev_get_drvdata(dev); -+ int retval = -EINVAL; -+ u8 __iomem *slot_addr; -+ u32 slot_size; -+ -+ spin_lock(&smpriv->kslock); -+ -+ slot_addr = smpriv->slot_get_address(dev, unit, slot); -+ slot_size = smpriv->slot_get_slot_size(dev, unit, slot); -+ -+ if (key_length > slot_size) { -+ retval = -EKEYREJECTED; -+ goto out; -+ } -+ -+ memcpy(key_data, slot_addr, key_length); -+ retval = 0; -+ -+out: -+ spin_unlock(&smpriv->kslock); -+ return retval; -+} -+EXPORT_SYMBOL(sm_keystore_slot_read); -+ -+int sm_keystore_slot_encapsulate(struct device *dev, u32 unit, u32 inslot, -+ u32 outslot, u16 secretlen, u8 *keymod, -+ u16 keymodlen) -+{ -+ struct caam_drv_private_sm *smpriv = dev_get_drvdata(dev); -+ int retval = 0; -+ u32 slot_length, dsize, jstat; -+ u32 __iomem *encapdesc = NULL; -+ u8 __iomem *lkeymod, *inpslotaddr, *outslotaddr; -+ dma_addr_t keymod_dma; -+ -+ /* Ensure that the full blob will fit in the key slot */ -+ slot_length = smpriv->slot_get_slot_size(dev, unit, outslot); -+ if ((secretlen + 48) > slot_length) -+ goto out; -+ -+ /* Get the base addresses of both keystore slots */ -+ inpslotaddr = (u8 *)smpriv->slot_get_address(dev, unit, inslot); -+ outslotaddr = (u8 *)smpriv->slot_get_address(dev, unit, outslot); -+ -+ /* Build the key modifier */ -+ lkeymod = kmalloc(keymodlen, GFP_KERNEL | GFP_DMA); -+ memcpy(lkeymod, keymod, keymodlen); -+ keymod_dma = dma_map_single(dev, lkeymod, keymodlen, DMA_TO_DEVICE); -+ dma_sync_single_for_device(dev, keymod_dma, keymodlen, DMA_TO_DEVICE); -+ -+ /* Build the encapsulation job descriptor */ -+ dsize = blob_encap_desc(&encapdesc, keymod_dma, keymodlen, -+ __pa(inpslotaddr), __pa(outslotaddr), -+ secretlen, 0); -+ if (!dsize) { -+ dev_err(dev, "can't alloc an encap descriptor\n"); -+ retval = -ENOMEM; -+ goto out; -+ } -+ jstat = sm_key_job(dev, encapdesc); -+ -+ dma_unmap_single(dev, keymod_dma, keymodlen, DMA_TO_DEVICE); -+ kfree(encapdesc); -+ -+out: -+ return retval; -+ -+} -+EXPORT_SYMBOL(sm_keystore_slot_encapsulate); -+ -+int sm_keystore_slot_decapsulate(struct device *dev, u32 unit, u32 inslot, -+ u32 outslot, u16 secretlen, u8 *keymod, -+ u16 keymodlen) -+{ -+ struct caam_drv_private_sm *smpriv = dev_get_drvdata(dev); -+ int retval = 0; -+ u32 slot_length, dsize, jstat; -+ u32 __iomem *decapdesc = NULL; -+ u8 __iomem *lkeymod, *inpslotaddr, *outslotaddr; -+ dma_addr_t keymod_dma; -+ -+ /* Ensure that the decap data will fit in the key slot */ -+ slot_length = smpriv->slot_get_slot_size(dev, unit, outslot); -+ if (secretlen > slot_length) -+ goto out; -+ -+ /* Get the base addresses of both keystore slots */ -+ inpslotaddr = (u8 *)smpriv->slot_get_address(dev, unit, 
inslot); -+ outslotaddr = (u8 *)smpriv->slot_get_address(dev, unit, outslot); -+ -+ /* Build the key modifier */ -+ lkeymod = kmalloc(keymodlen, GFP_KERNEL | GFP_DMA); -+ memcpy(lkeymod, keymod, keymodlen); -+ keymod_dma = dma_map_single(dev, lkeymod, keymodlen, DMA_TO_DEVICE); -+ dma_sync_single_for_device(dev, keymod_dma, keymodlen, DMA_TO_DEVICE); -+ -+ /* Build the decapsulation job descriptor */ -+ dsize = blob_decap_desc(&decapdesc, keymod_dma, keymodlen, -+ __pa(inpslotaddr), __pa(outslotaddr), -+ secretlen, 0); -+ if (!dsize) { -+ dev_err(dev, "can't alloc a decap descriptor\n"); -+ retval = -ENOMEM; -+ goto out; -+ } -+ jstat = sm_key_job(dev, decapdesc); -+ -+ dma_unmap_single(dev, keymod_dma, keymodlen, DMA_TO_DEVICE); -+ kfree(decapdesc); -+ -+out: -+ return retval; -+ -+} -+EXPORT_SYMBOL(sm_keystore_slot_decapsulate); -+ -+ -+/* -+ * Initialization/shutdown subsystem -+ * Assumes statically-invoked startup/shutdown from the controller driver -+ * for the present time, to be reworked when a device tree becomes -+ * available. This code will not modularize in present form. -+ * -+ * Also, simply uses ring 0 for execution at the present -+ */ -+ -+int caam_sm_startup(struct platform_device *pdev) -+{ -+ struct device *ctrldev, *smdev; -+ struct caam_drv_private *ctrlpriv; -+ struct caam_drv_private_sm *smpriv; -+ struct caam_drv_private_jr *jrpriv; /* need this for reg page */ -+ struct platform_device *sm_pdev; -+ struct sm_page_descriptor *lpagedesc; -+ u32 page, pgstat, lpagect, detectedpage; -+ -+ struct device_node *np; -+ ctrldev = &pdev->dev; -+ ctrlpriv = dev_get_drvdata(ctrldev); -+ -+ /* -+ * Set up the private block for secure memory -+ * Only one instance is possible -+ */ -+ smpriv = kzalloc(sizeof(struct caam_drv_private_sm), GFP_KERNEL); -+ if (smpriv == NULL) { -+ dev_err(ctrldev, "can't alloc private mem for secure memory\n"); -+ return -ENOMEM; -+ } -+ smpriv->parentdev = ctrldev; /* copy of parent dev is handy */ -+ -+ /* Create the dev */ -+#ifdef CONFIG_OF -+ np = of_find_compatible_node(NULL, NULL, "fsl,imx6q-caam-sm"); -+ sm_pdev = of_platform_device_create(np, "caam_sm", ctrldev); -+#else -+ sm_pdev = platform_device_register_data(ctrldev, "caam_sm", 0, -+ smpriv, -+ sizeof(struct caam_drv_private_sm)); -+#endif -+ if (sm_pdev == NULL) { -+ kfree(smpriv); -+ return -EINVAL; -+ } -+ smdev = &sm_pdev->dev; -+ dev_set_drvdata(smdev, smpriv); -+ ctrlpriv->smdev = smdev; -+ -+ /* -+ * Collect configuration limit data for reference -+ * This batch comes from the partition data/vid registers in perfmon -+ */ -+ smpriv->max_pages = ((rd_reg32(&ctrlpriv->ctrl->perfmon.smpart) -+ & SMPART_MAX_NUMPG_MASK) >> -+ SMPART_MAX_NUMPG_SHIFT) + 1; -+ smpriv->top_partition = ((rd_reg32(&ctrlpriv->ctrl->perfmon.smpart) -+ & SMPART_MAX_PNUM_MASK) >> -+ SMPART_MAX_PNUM_SHIFT) + 1; -+ smpriv->top_page = ((rd_reg32(&ctrlpriv->ctrl->perfmon.smpart) -+ & SMPART_MAX_PG_MASK) >> SMPART_MAX_PG_SHIFT) + 1; -+ smpriv->page_size = 1024 << ((rd_reg32(&ctrlpriv->ctrl->perfmon.smvid) -+ & SMVID_PG_SIZE_MASK) >> SMVID_PG_SIZE_SHIFT); -+ smpriv->slot_size = 1 << CONFIG_CRYPTO_DEV_FSL_CAAM_SM_SLOTSIZE; -+ -+#ifdef SM_DEBUG -+ dev_info(smdev, "max pages = %d, top partition = %d\n", -+ smpriv->max_pages, smpriv->top_partition); -+ dev_info(smdev, "top page = %d, page size = %d (total = %d)\n", -+ smpriv->top_page, smpriv->page_size, -+ smpriv->top_page * smpriv->page_size); -+ dev_info(smdev, "selected slot size = %d\n", smpriv->slot_size); -+#endif -+ -+ /* -+ * Now probe for partitions/pages to 
which we have access. Note that -+ * these have likely been set up by a bootloader or platform -+ * provisioning application, so we have to assume that we "inherit" -+ * a configuration and work within the constraints of what it might be. -+ * -+ * Assume use of the zeroth ring in the present iteration (until -+ * we can divorce the controller and ring drivers, and then assign -+ * an SM instance to any ring instance). -+ */ -+ smpriv->smringdev = ctrlpriv->jrdev[0]; -+ jrpriv = dev_get_drvdata(smpriv->smringdev); -+ lpagect = 0; -+ lpagedesc = kzalloc(sizeof(struct sm_page_descriptor) -+ * smpriv->max_pages, GFP_KERNEL); -+ if (lpagedesc == NULL) { -+ kfree(smpriv); -+ return -ENOMEM; -+ } -+ -+ for (page = 0; page < smpriv->max_pages; page++) { -+ wr_reg32(&jrpriv->rregs->sm_cmd, -+ ((page << SMC_PAGE_SHIFT) & SMC_PAGE_MASK) | -+ (SMC_CMD_PAGE_INQUIRY & SMC_CMD_MASK)); -+ pgstat = rd_reg32(&jrpriv->rregs->sm_status); -+ if (((pgstat & SMCS_PGWON_MASK) >> SMCS_PGOWN_SHIFT) -+ == SMCS_PGOWN_OWNED) { /* our page? */ -+ lpagedesc[page].phys_pagenum = -+ (pgstat & SMCS_PAGE_MASK) >> SMCS_PAGE_SHIFT; -+ lpagedesc[page].own_part = -+ (pgstat & SMCS_PART_SHIFT) >> SMCS_PART_MASK; -+ lpagedesc[page].pg_base = ctrlpriv->sm_base + -+ ((smpriv->page_size * page) / sizeof(u32)); -+ lpagect++; -+#ifdef SM_DEBUG -+ dev_info(smdev, -+ "physical page %d, owning partition = %d\n", -+ lpagedesc[page].phys_pagenum, -+ lpagedesc[page].own_part); -+#endif -+ } -+ } -+ -+ smpriv->pagedesc = kzalloc(sizeof(struct sm_page_descriptor) * lpagect, -+ GFP_KERNEL); -+ if (smpriv->pagedesc == NULL) { -+ kfree(lpagedesc); -+ kfree(smpriv); -+ return -ENOMEM; -+ } -+ smpriv->localpages = lpagect; -+ -+ detectedpage = 0; -+ for (page = 0; page < smpriv->max_pages; page++) { -+ if (lpagedesc[page].pg_base != NULL) { /* e.g. 
live entry */ -+ memcpy(&smpriv->pagedesc[detectedpage], -+ &lpagedesc[page], -+ sizeof(struct sm_page_descriptor)); -+#ifdef SM_DEBUG_CONT -+ sm_show_page(smdev, &smpriv->pagedesc[detectedpage]); -+#endif -+ detectedpage++; -+ } -+ } -+ -+ kfree(lpagedesc); -+ -+ sm_init_keystore(smdev); -+ -+ return 0; -+} -+ -+void caam_sm_shutdown(struct platform_device *pdev) -+{ -+ struct device *ctrldev, *smdev; -+ struct caam_drv_private *priv; -+ struct caam_drv_private_sm *smpriv; -+ -+ ctrldev = &pdev->dev; -+ priv = dev_get_drvdata(ctrldev); -+ smdev = priv->smdev; -+ smpriv = dev_get_drvdata(smdev); -+ -+ kfree(smpriv->pagedesc); -+ kfree(smpriv); -+} -+EXPORT_SYMBOL(caam_sm_shutdown); -+#ifdef CONFIG_OF -+static void __exit caam_sm_exit(void) -+{ -+ struct device_node *dev_node; -+ struct platform_device *pdev; -+ -+ dev_node = of_find_compatible_node(NULL, NULL, "fsl,sec-v4.0"); -+ if (!dev_node) { -+ dev_node = of_find_compatible_node(NULL, NULL, "fsl,sec4.0"); -+ if (!dev_node) -+ return; -+ } -+ -+ pdev = of_find_device_by_node(dev_node); -+ if (!pdev) -+ return; -+ -+ of_node_put(dev_node); -+ -+ caam_sm_shutdown(pdev); -+ -+ return; -+} -+ -+static int __init caam_sm_init(void) -+{ -+ struct device_node *dev_node; -+ struct platform_device *pdev; -+ -+ /* -+ * Do of_find_compatible_node() then of_find_device_by_node() -+ * once a functional device tree is available -+ */ -+ dev_node = of_find_compatible_node(NULL, NULL, "fsl,sec-v4.0"); -+ if (!dev_node) { -+ dev_node = of_find_compatible_node(NULL, NULL, "fsl,sec4.0"); -+ if (!dev_node) -+ return -ENODEV; -+ } -+ -+ pdev = of_find_device_by_node(dev_node); -+ if (!pdev) -+ return -ENODEV; -+ -+ of_node_get(dev_node); -+ -+ caam_sm_startup(pdev); -+ -+ return 0; -+} -+ -+module_init(caam_sm_init); -+module_exit(caam_sm_exit); -+ -+MODULE_LICENSE("Dual BSD/GPL"); -+MODULE_DESCRIPTION("FSL CAAM Secure Memory / Keystore"); -+MODULE_AUTHOR("Freescale Semiconductor - NMSG/MAD"); -+#endif -diff -Nur linux-4.1.3/drivers/crypto/caam/sm_test.c linux-xbian-imx6/drivers/crypto/caam/sm_test.c ---- linux-4.1.3/drivers/crypto/caam/sm_test.c 1970-01-01 01:00:00.000000000 +0100 -+++ linux-xbian-imx6/drivers/crypto/caam/sm_test.c 2015-07-27 23:13:04.213947410 +0200 -@@ -0,0 +1,844 @@ -+/* -+ * Secure Memory / Keystore Exemplification Module -+ * Copyright (C) 2013 Freescale Semiconductor, Inc. All Rights Reserved -+ * -+ * Serves as a functional example, and as a self-contained unit test for -+ * the functionality contained in sm_store.c. -+ * -+ * The example function, caam_sm_example_init(), runs a thread that: -+ * -+ * - initializes a set of fixed keys -+ * - stores one copy in clear buffers -+ * - stores them again in secure memory -+ * - extracts stored keys back out for use -+ * - intializes 3 data buffers for a test: -+ * (1) containing cleartext -+ * (2) to hold ciphertext encrypted with an extracted black key -+ * (3) to hold extracted cleartext decrypted with an equivalent clear key -+ * -+ * The function then builds simple job descriptors that reference the key -+ * material and buffers as initialized, and executes an encryption job -+ * with a black key, and a decryption job using a the same key held in the -+ * clear. The output of the decryption job is compared to the original -+ * cleartext; if they don't compare correctly, one can assume a key problem -+ * exists, where the function will exit with an error. -+ * -+ * This module can use a substantial amount of refactoring, which may occur -+ * after the API gets some mileage. 
Furthermore, expect this module to -+ * eventually disappear once the API is integrated into "real" software. -+ */ -+ -+#include "compat.h" -+#include "intern.h" -+#include "desc.h" -+#include "error.h" -+#include "jr.h" -+#include "sm.h" -+ -+static u8 skeymod[] = { -+ 0x0f, 0x0e, 0x0d, 0x0c, 0x0b, 0x0a, 0x09, 0x08, -+ 0x07, 0x06, 0x05, 0x04, 0x03, 0x02, 0x01, 0x00 -+}; -+static u8 symkey[] = { -+ 0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, -+ 0x08, 0x09, 0x0a, 0x0b, 0x0c, 0x0d, 0x0e, 0x0f, -+ 0x10, 0x11, 0x12, 0x13, 0x14, 0x15, 0x16, 0x17, -+ 0x18, 0x19, 0x1a, 0x1b, 0x1c, 0x1d, 0x1e, 0x1f -+}; -+ -+static u8 symdata[] = { -+ 0x00, 0x01, 0x02, 0x03, 0x04, 0x0f, 0x06, 0x07, -+ 0x08, 0x09, 0x0a, 0x0b, 0x0c, 0x0d, 0x0e, 0x0f, -+ 0x10, 0x11, 0x12, 0x13, 0x14, 0x15, 0x16, 0x17, -+ 0x18, 0x19, 0x1a, 0x1b, 0x1c, 0x1d, 0x1e, 0x1f, -+ 0x20, 0x21, 0x22, 0x23, 0x24, 0x25, 0x26, 0x27, -+ 0x28, 0x29, 0x2a, 0x2b, 0x2c, 0x2d, 0x2e, 0x2f, -+ 0x30, 0x31, 0x32, 0x33, 0x34, 0x35, 0x36, 0x37, -+ 0x38, 0x39, 0x3a, 0x3b, 0x3c, 0x3d, 0x3e, 0x3f, -+ 0x40, 0x41, 0x42, 0x43, 0x44, 0x45, 0x46, 0x47, -+ 0x48, 0x49, 0x4a, 0x4b, 0x4c, 0x4d, 0x4e, 0x4f, -+ 0x50, 0x51, 0x52, 0x53, 0x54, 0x55, 0x56, 0x57, -+ 0x58, 0x59, 0x5a, 0x5b, 0x5c, 0x5d, 0x5e, 0x5f, -+ 0x60, 0x61, 0x62, 0x63, 0x64, 0x65, 0x66, 0x67, -+ 0x68, 0x69, 0x6a, 0x6b, 0x6c, 0x6d, 0x6e, 0x6f, -+ 0x70, 0x71, 0x72, 0x73, 0x74, 0x75, 0x76, 0x77, -+ 0x78, 0x79, 0x7a, 0x7b, 0x7c, 0x7d, 0x7e, 0x7f, -+ 0x80, 0x81, 0x82, 0x83, 0x84, 0x85, 0x86, 0x87, -+ 0x88, 0x89, 0x8a, 0x8b, 0x8c, 0x8d, 0x8e, 0x8f, -+ 0x90, 0x91, 0x92, 0x93, 0x94, 0x95, 0x96, 0x97, -+ 0x98, 0x99, 0x9a, 0x9b, 0x9c, 0x9d, 0x9e, 0x9f, -+ 0xa0, 0xa1, 0xa2, 0xa3, 0xa4, 0xa5, 0xa6, 0xa7, -+ 0xa8, 0xa9, 0xaa, 0xab, 0xac, 0xad, 0xae, 0xaf, -+ 0xb0, 0xb1, 0xb2, 0xb3, 0xb4, 0xb5, 0xb6, 0xb7, -+ 0xb8, 0xb9, 0xba, 0xbb, 0xbc, 0xbd, 0xbe, 0xbf, -+ 0xc0, 0xc1, 0xc2, 0xc3, 0xc4, 0xc5, 0xc6, 0xc7, -+ 0xc8, 0xc9, 0xca, 0xcb, 0xcc, 0xcd, 0xce, 0xcf, -+ 0xd0, 0xd1, 0xd2, 0xd3, 0xd4, 0xd5, 0xd6, 0xd7, -+ 0xd8, 0xd9, 0xda, 0xdb, 0xdc, 0xdd, 0xde, 0xdf, -+ 0xe0, 0xe1, 0xe2, 0xe3, 0xe4, 0xe5, 0xe6, 0xe7, -+ 0xe8, 0xe9, 0xea, 0xeb, 0xec, 0xed, 0xee, 0xef, -+ 0xf0, 0xf1, 0xf2, 0xf3, 0xf4, 0xf5, 0xf6, 0xf7, -+ 0xf8, 0xf9, 0xfa, 0xfb, 0xfc, 0xfd, 0xfe, 0xff -+}; -+ -+static int mk_job_desc(u32 *desc, dma_addr_t key, u16 keysz, dma_addr_t indata, -+ dma_addr_t outdata, u16 sz, u32 cipherdir, u32 keymode) -+{ -+ desc[1] = CMD_KEY | CLASS_1 | (keysz & KEY_LENGTH_MASK) | keymode; -+ desc[2] = (u32)key; -+ desc[3] = CMD_OPERATION | OP_TYPE_CLASS1_ALG | OP_ALG_AAI_ECB | -+ cipherdir; -+ desc[4] = CMD_FIFO_LOAD | FIFOLD_CLASS_CLASS1 | -+ FIFOLD_TYPE_MSG | FIFOLD_TYPE_LAST1 | sz; -+ desc[5] = (u32)indata; -+ desc[6] = CMD_FIFO_STORE | FIFOST_TYPE_MESSAGE_DATA | sz; -+ desc[7] = (u32)outdata; -+ -+ desc[0] = CMD_DESC_HDR | HDR_ONE | (8 & HDR_DESCLEN_MASK); -+ return 8 * sizeof(u32); -+} -+ -+struct exec_test_result { -+ int error; -+ struct completion completion; -+}; -+ -+void exec_test_done(struct device *dev, u32 *desc, u32 err, void *context) -+{ -+ struct exec_test_result *res = context; -+ -+ if (err) { -+ char tmp[CAAM_ERROR_STR_MAX]; -+ dev_err(dev, "%08x: %s\n", err, caam_jr_strstatus(tmp, err)); -+ } -+ -+ res->error = err; -+ complete(&res->completion); -+} -+ -+static int exec_test_job(struct device *ksdev, u32 *jobdesc) -+{ -+ struct exec_test_result testres; -+ struct caam_drv_private_sm *kspriv; -+ int rtn = 0; -+ -+ kspriv = dev_get_drvdata(ksdev); -+ -+ init_completion(&testres.completion); -+ -+ rtn = 
caam_jr_enqueue(kspriv->smringdev, jobdesc, exec_test_done, -+ &testres); -+ if (!rtn) { -+ wait_for_completion_interruptible(&testres.completion); -+ rtn = testres.error; -+ } -+ return rtn; -+} -+ -+ -+int caam_sm_example_init(struct platform_device *pdev) -+{ -+ struct device *ctrldev, *ksdev; -+ struct caam_drv_private *ctrlpriv; -+ struct caam_drv_private_sm *kspriv; -+ u32 unit, units, jdescsz; -+ int stat, jstat, rtnval = 0; -+ u8 __iomem *syminp, *symint, *symout = NULL; -+ dma_addr_t syminp_dma, symint_dma, symout_dma; -+ u8 __iomem *black_key_des, *black_key_aes128; -+ u8 __iomem *black_key_aes256; -+ dma_addr_t black_key_des_dma, black_key_aes128_dma; -+ dma_addr_t black_key_aes256_dma; -+ u8 __iomem *clear_key_des, *clear_key_aes128, *clear_key_aes256; -+ dma_addr_t clear_key_des_dma, clear_key_aes128_dma; -+ dma_addr_t clear_key_aes256_dma; -+ u32 __iomem *jdesc; -+ u32 keyslot_des, keyslot_aes128, keyslot_aes256 = 0; -+ -+ jdesc = NULL; -+ black_key_des = black_key_aes128 = black_key_aes256 = NULL; -+ clear_key_des = clear_key_aes128 = clear_key_aes256 = NULL; -+ -+ /* We can lose this cruft once we can get a pdev by name */ -+ ctrldev = &pdev->dev; -+ ctrlpriv = dev_get_drvdata(ctrldev); -+ ksdev = ctrlpriv->smdev; -+ kspriv = dev_get_drvdata(ksdev); -+ if (kspriv == NULL) -+ return -ENODEV; -+ -+ /* Now that we have the dev for the single SM instance, connect */ -+#ifdef SM_TEST_DETAIL -+ dev_info(ksdev, "caam_sm_test_init() running\n"); -+#endif -+ /* Probe to see what keystores are available to us */ -+ units = sm_detect_keystore_units(ksdev); -+ if (!units) -+ dev_err(ksdev, "caam_sm_test: no keystore units available\n"); -+ -+ /* -+ * MX6 bootloader stores some stuff in unit 0, so let's -+ * use 1 or above -+ */ -+ if (units < 2) { -+ dev_err(ksdev, "caam_sm_test: insufficient keystore units\n"); -+ return -ENODEV; -+ } -+ unit = 1; -+ -+#ifdef SM_TEST_DETAIL -+ dev_info(ksdev, "caam_sm_test: %d keystore units available\n", units); -+#endif -+ -+ /* Initialize/Establish Keystore */ -+ sm_establish_keystore(ksdev, unit); /* Initalize store in #1 */ -+ -+ /* -+ * Top of main test thread -+ */ -+ -+ /* Allocate test data blocks (input, intermediate, output) */ -+ syminp = kmalloc(256, GFP_KERNEL | GFP_DMA); -+ symint = kmalloc(256, GFP_KERNEL | GFP_DMA); -+ symout = kmalloc(256, GFP_KERNEL | GFP_DMA); -+ if ((syminp == NULL) || (symint == NULL) || (symout == NULL)) { -+ rtnval = -ENOMEM; -+ dev_err(ksdev, "caam_sm_test: can't get test data buffers\n"); -+ goto freemem; -+ } -+ -+ /* Allocate storage for 3 black keys: encapsulated 8, 16, 32 */ -+ black_key_des = kmalloc(16, GFP_KERNEL | GFP_DMA); /* padded to 16... 
*/ -+ black_key_aes128 = kmalloc(16, GFP_KERNEL | GFP_DMA); -+ black_key_aes256 = kmalloc(16, GFP_KERNEL | GFP_DMA); -+ if ((black_key_des == NULL) || (black_key_aes128 == NULL) || -+ (black_key_aes256 == NULL)) { -+ rtnval = -ENOMEM; -+ dev_err(ksdev, "caam_sm_test: can't black key buffers\n"); -+ goto freemem; -+ } -+ -+ clear_key_des = kmalloc(8, GFP_KERNEL | GFP_DMA); -+ clear_key_aes128 = kmalloc(16, GFP_KERNEL | GFP_DMA); -+ clear_key_aes256 = kmalloc(32, GFP_KERNEL | GFP_DMA); -+ if ((clear_key_des == NULL) || (clear_key_aes128 == NULL) || -+ (clear_key_aes256 == NULL)) { -+ rtnval = -ENOMEM; -+ dev_err(ksdev, "caam_sm_test: can't get clear key buffers\n"); -+ goto freemem; -+ } -+ -+ /* Allocate storage for job descriptor */ -+ jdesc = kmalloc(8 * sizeof(u32), GFP_KERNEL | GFP_DMA); -+ if (jdesc == NULL) { -+ rtnval = -ENOMEM; -+ dev_err(ksdev, "caam_sm_test: can't get descriptor buffers\n"); -+ goto freemem; -+ } -+ -+#ifdef SM_TEST_DETAIL -+ dev_info(ksdev, "caam_sm_test: all buffers allocated\n"); -+#endif -+ -+ /* Load up input data block, clear outputs */ -+ memcpy(syminp, symdata, 256); -+ memset(symint, 0, 256); -+ memset(symout, 0, 256); -+#ifdef SM_TEST_DETAIL -+ dev_info(ksdev, "0x%02x 0x%02x 0x%02x 0x%02x " \ -+ "0x%02x 0x%02x 0x%02x 0x%02x\n", -+ syminp[0], syminp[1], syminp[2], syminp[3], -+ syminp[4], syminp[5], syminp[6], syminp[7]); -+ dev_info(ksdev, "0x%02x 0x%02x 0x%02x 0x%02x " \ -+ "0x%02x 0x%02x 0x%02x 0x%02x\n", -+ symint[0], symint[1], symint[2], symint[3], -+ symint[4], symint[5], symint[6], symint[7]); -+ dev_info(ksdev, "0x%02x 0x%02x 0x%02x 0x%02x " \ -+ "0x%02x 0x%02x 0x%02x 0x%02x\n", -+ symout[0], symout[1], symout[2], symout[3], -+ symout[4], symout[5], symout[6], symout[7]); -+ -+ dev_info(ksdev, "caam_sm_test: data buffers initialized\n"); -+#endif -+ -+ /* Load up clear keys */ -+ memcpy(clear_key_des, symkey, 8); -+ memcpy(clear_key_aes128, symkey, 16); -+ memcpy(clear_key_aes256, symkey, 32); -+ -+#ifdef SM_TEST_DETAIL -+ dev_info(ksdev, "caam_sm_test: all clear keys loaded\n"); -+#endif -+ -+ /* -+ * Place clear keys in keystore. -+ * All the interesting stuff happens here. 
-+ */ -+ /* 8 bit DES key */ -+ stat = sm_keystore_slot_alloc(ksdev, unit, 8, &keyslot_des); -+ if (stat) -+ goto freemem; -+#ifdef SM_TEST_DETAIL -+ dev_info(ksdev, "caam_sm_test: 8 byte key slot in %d\n", keyslot_des); -+#endif -+ stat = sm_keystore_slot_load(ksdev, unit, keyslot_des, clear_key_des, -+ 8); -+ if (stat) { -+#ifdef SM_TEST_DETAIL -+ dev_info(ksdev, "caam_sm_test: can't load 8 byte key in %d\n", -+ keyslot_des); -+#endif -+ sm_keystore_slot_dealloc(ksdev, unit, keyslot_des); -+ goto freemem; -+ } -+ -+ /* 16 bit AES key */ -+ stat = sm_keystore_slot_alloc(ksdev, unit, 16, &keyslot_aes128); -+ if (stat) { -+ sm_keystore_slot_dealloc(ksdev, unit, keyslot_des); -+ goto freemem; -+ } -+#ifdef SM_TEST_DETAIL -+ dev_info(ksdev, "caam_sm_test: 16 byte key slot in %d\n", -+ keyslot_aes128); -+#endif -+ stat = sm_keystore_slot_load(ksdev, unit, keyslot_aes128, -+ clear_key_aes128, 16); -+ if (stat) { -+#ifdef SM_TEST_DETAIL -+ dev_info(ksdev, "caam_sm_test: can't load 16 byte key in %d\n", -+ keyslot_aes128); -+#endif -+ sm_keystore_slot_dealloc(ksdev, unit, keyslot_aes128); -+ sm_keystore_slot_dealloc(ksdev, unit, keyslot_des); -+ goto freemem; -+ } -+ -+ /* 32 bit AES key */ -+ stat = sm_keystore_slot_alloc(ksdev, unit, 32, &keyslot_aes256); -+ if (stat) { -+ sm_keystore_slot_dealloc(ksdev, unit, keyslot_aes128); -+ sm_keystore_slot_dealloc(ksdev, unit, keyslot_des); -+ goto freemem; -+ } -+#ifdef SM_TEST_DETAIL -+ dev_info(ksdev, "caam_sm_test: 32 byte key slot in %d\n", -+ keyslot_aes256); -+#endif -+ stat = sm_keystore_slot_load(ksdev, unit, keyslot_aes256, -+ clear_key_aes256, 32); -+ if (stat) { -+#ifdef SM_TEST_DETAIL -+ dev_info(ksdev, "caam_sm_test: can't load 32 byte key in %d\n", -+ keyslot_aes128); -+#endif -+ sm_keystore_slot_dealloc(ksdev, unit, keyslot_aes256); -+ sm_keystore_slot_dealloc(ksdev, unit, keyslot_aes128); -+ sm_keystore_slot_dealloc(ksdev, unit, keyslot_des); -+ goto freemem; -+ } -+ -+ /* Encapsulate all keys as SM blobs */ -+ stat = sm_keystore_slot_encapsulate(ksdev, unit, keyslot_des, -+ keyslot_des, 8, skeymod, 8); -+ if (stat) { -+ dev_info(ksdev, "caam_sm_test: can't encapsulate DES key\n"); -+ goto freekeys; -+ } -+ -+ stat = sm_keystore_slot_encapsulate(ksdev, unit, keyslot_aes128, -+ keyslot_aes128, 16, skeymod, 8); -+ if (stat) { -+ dev_info(ksdev, "caam_sm_test: can't encapsulate AES128 key\n"); -+ goto freekeys; -+ } -+ -+ stat = sm_keystore_slot_encapsulate(ksdev, unit, keyslot_aes256, -+ keyslot_aes256, 32, skeymod, 8); -+ if (stat) { -+ dev_info(ksdev, "caam_sm_test: can't encapsulate AES256 key\n"); -+ goto freekeys; -+ } -+ -+ /* Now decapsulate as black key blobs */ -+ stat = sm_keystore_slot_decapsulate(ksdev, unit, keyslot_des, -+ keyslot_des, 8, skeymod, 8); -+ if (stat) { -+ dev_info(ksdev, "caam_sm_test: can't decapsulate DES key\n"); -+ goto freekeys; -+ } -+ -+ stat = sm_keystore_slot_decapsulate(ksdev, unit, keyslot_aes128, -+ keyslot_aes128, 16, skeymod, 8); -+ if (stat) { -+ dev_info(ksdev, "caam_sm_test: can't decapsulate AES128 key\n"); -+ goto freekeys; -+ } -+ -+ stat = sm_keystore_slot_decapsulate(ksdev, unit, keyslot_aes256, -+ keyslot_aes256, 32, skeymod, 8); -+ if (stat) { -+ dev_info(ksdev, "caam_sm_test: can't decapsulate AES128 key\n"); -+ goto freekeys; -+ } -+ -+ /* Extract 8/16/32 byte black keys */ -+ sm_keystore_slot_read(ksdev, unit, keyslot_des, 8, black_key_des); -+ sm_keystore_slot_read(ksdev, unit, keyslot_aes128, 16, -+ black_key_aes128); -+ sm_keystore_slot_read(ksdev, unit, keyslot_aes256, 32, -+ 
black_key_aes256); -+ -+#ifdef SM_TEST_DETAIL -+ dev_info(ksdev, "caam_sm_test: all black keys extracted\n"); -+#endif -+ -+ /* DES encrypt using 8 byte black key */ -+ black_key_des_dma = dma_map_single(ksdev, black_key_des, 8, -+ DMA_TO_DEVICE); -+ dma_sync_single_for_device(ksdev, black_key_des_dma, 8, DMA_TO_DEVICE); -+ syminp_dma = dma_map_single(ksdev, syminp, 256, DMA_TO_DEVICE); -+ dma_sync_single_for_device(ksdev, syminp_dma, 256, DMA_TO_DEVICE); -+ symint_dma = dma_map_single(ksdev, symint, 256, DMA_FROM_DEVICE); -+ -+ jdescsz = mk_job_desc(jdesc, black_key_des_dma, 8, syminp_dma, -+ symint_dma, 256, -+ OP_ALG_ENCRYPT | OP_ALG_ALGSEL_DES, 0); -+ -+#ifdef SM_TEST_DETAIL -+ dev_info(ksdev, "jobdesc:\n"); -+ dev_info(ksdev, "0x%08x\n", jdesc[0]); -+ dev_info(ksdev, "0x%08x\n", jdesc[1]); -+ dev_info(ksdev, "0x%08x\n", jdesc[2]); -+ dev_info(ksdev, "0x%08x\n", jdesc[3]); -+ dev_info(ksdev, "0x%08x\n", jdesc[4]); -+ dev_info(ksdev, "0x%08x\n", jdesc[5]); -+ dev_info(ksdev, "0x%08x\n", jdesc[6]); -+ dev_info(ksdev, "0x%08x\n", jdesc[7]); -+#endif -+ -+ jstat = exec_test_job(ksdev, jdesc); -+ -+ dma_sync_single_for_cpu(ksdev, symint_dma, 256, DMA_FROM_DEVICE); -+ dma_unmap_single(ksdev, symint_dma, 256, DMA_FROM_DEVICE); -+ dma_unmap_single(ksdev, syminp_dma, 256, DMA_TO_DEVICE); -+ dma_unmap_single(ksdev, black_key_des_dma, 8, DMA_TO_DEVICE); -+ -+#ifdef SM_TEST_DETAIL -+ dev_info(ksdev, "input block:\n"); -+ dev_info(ksdev, "0x%02x 0x%02x 0x%02x 0x%02x " \ -+ "0x%02x 0x%02x 0x%02x 0x%02x\n", -+ syminp[0], syminp[1], syminp[2], syminp[3], -+ syminp[4], syminp[5], syminp[6], syminp[7]); -+ dev_info(ksdev, "0x%02x 0x%02x 0x%02x 0x%02x " \ -+ "0x%02x 0x%02x 0x%02x 0x%02x\n", -+ syminp[8], syminp[9], syminp[10], syminp[11], -+ syminp[12], syminp[13], syminp[14], syminp[15]); -+ dev_info(ksdev, "intermediate block:\n"); -+ dev_info(ksdev, "0x%02x 0x%02x 0x%02x 0x%02x " \ -+ "0x%02x 0x%02x 0x%02x 0x%02x\n", -+ symint[0], symint[1], symint[2], symint[3], -+ symint[4], symint[5], symint[6], symint[7]); -+ dev_info(ksdev, "0x%02x 0x%02x 0x%02x 0x%02x " \ -+ "0x%02x 0x%02x 0x%02x 0x%02x\n", -+ symint[8], symint[9], symint[10], symint[11], -+ symint[12], symint[13], symint[14], symint[15]); -+ dev_info(ksdev, "caam_sm_test: encrypt cycle with 8 byte key\n"); -+#endif -+ -+ /* DES decrypt using 8 byte clear key */ -+ clear_key_des_dma = dma_map_single(ksdev, clear_key_des, 8, -+ DMA_TO_DEVICE); -+ dma_sync_single_for_device(ksdev, clear_key_des_dma, 8, DMA_TO_DEVICE); -+ symint_dma = dma_map_single(ksdev, symint, 256, DMA_TO_DEVICE); -+ dma_sync_single_for_device(ksdev, symint_dma, 256, DMA_TO_DEVICE); -+ symout_dma = dma_map_single(ksdev, symout, 256, DMA_FROM_DEVICE); -+ -+ jdescsz = mk_job_desc(jdesc, clear_key_des_dma, 8, symint_dma, -+ symout_dma, 256, -+ OP_ALG_DECRYPT | OP_ALG_ALGSEL_DES, 0); -+ -+#ifdef SM_TEST_DETAIL -+ dev_info(ksdev, "jobdesc:\n"); -+ dev_info(ksdev, "0x%08x\n", jdesc[0]); -+ dev_info(ksdev, "0x%08x\n", jdesc[1]); -+ dev_info(ksdev, "0x%08x\n", jdesc[2]); -+ dev_info(ksdev, "0x%08x\n", jdesc[3]); -+ dev_info(ksdev, "0x%08x\n", jdesc[4]); -+ dev_info(ksdev, "0x%08x\n", jdesc[5]); -+ dev_info(ksdev, "0x%08x\n", jdesc[6]); -+ dev_info(ksdev, "0x%08x\n", jdesc[7]); -+#endif -+ -+ jstat = exec_test_job(ksdev, jdesc); -+ -+ dma_sync_single_for_cpu(ksdev, symout_dma, 256, DMA_FROM_DEVICE); -+ dma_unmap_single(ksdev, symout_dma, 256, DMA_FROM_DEVICE); -+ dma_unmap_single(ksdev, symint_dma, 256, DMA_TO_DEVICE); -+ dma_unmap_single(ksdev, clear_key_des_dma, 8, DMA_TO_DEVICE); -+ 
-+#ifdef SM_TEST_DETAIL -+ dev_info(ksdev, "intermediate block:\n"); -+ dev_info(ksdev, "0x%02x 0x%02x 0x%02x 0x%02x " \ -+ "0x%02x 0x%02x 0x%02x 0x%02x\n", -+ symint[0], symint[1], symint[2], symint[3], -+ symint[4], symint[5], symint[6], symint[7]); -+ dev_info(ksdev, "0x%02x 0x%02x 0x%02x 0x%02x " \ -+ "0x%02x 0x%02x 0x%02x 0x%02x\n", -+ symint[8], symint[9], symint[10], symint[11], -+ symint[12], symint[13], symint[14], symint[15]); -+ dev_info(ksdev, "decrypted block:\n"); -+ dev_info(ksdev, "0x%02x 0x%02x 0x%02x 0x%02x " \ -+ "0x%02x 0x%02x 0x%02x 0x%02x\n", -+ symout[0], symout[1], symout[2], symout[3], -+ symout[4], symout[5], symout[6], symout[7]); -+ dev_info(ksdev, "0x%02x 0x%02x 0x%02x 0x%02x " \ -+ "0x%02x 0x%02x 0x%02x 0x%02x\n", -+ symout[8], symout[9], symout[10], symout[11], -+ symout[12], symout[13], symout[14], symout[15]); -+ dev_info(ksdev, "caam_sm_test: decrypt cycle with 8 byte key\n"); -+#endif -+ -+ /* Check result */ -+ if (memcmp(symout, syminp, 256)) { -+ dev_info(ksdev, "caam_sm_test: 8-byte key test mismatch\n"); -+ rtnval = -1; -+ goto freekeys; -+ } else -+ dev_info(ksdev, "caam_sm_test: 8-byte key test match OK\n"); -+ -+ /* AES-128 encrypt using 16 byte black key */ -+ black_key_aes128_dma = dma_map_single(ksdev, black_key_aes128, 16, -+ DMA_TO_DEVICE); -+ dma_sync_single_for_device(ksdev, black_key_aes128_dma, 16, -+ DMA_TO_DEVICE); -+ syminp_dma = dma_map_single(ksdev, syminp, 256, DMA_TO_DEVICE); -+ dma_sync_single_for_device(ksdev, syminp_dma, 256, DMA_TO_DEVICE); -+ symint_dma = dma_map_single(ksdev, symint, 256, DMA_FROM_DEVICE); -+ -+ jdescsz = mk_job_desc(jdesc, black_key_aes128_dma, 16, syminp_dma, -+ symint_dma, 256, -+ OP_ALG_ENCRYPT | OP_ALG_ALGSEL_AES, 0); -+ -+#ifdef SM_TEST_DETAIL -+ dev_info(ksdev, "jobdesc:\n"); -+ dev_info(ksdev, "0x%08x\n", jdesc[0]); -+ dev_info(ksdev, "0x%08x\n", jdesc[1]); -+ dev_info(ksdev, "0x%08x\n", jdesc[2]); -+ dev_info(ksdev, "0x%08x\n", jdesc[3]); -+ dev_info(ksdev, "0x%08x\n", jdesc[4]); -+ dev_info(ksdev, "0x%08x\n", jdesc[5]); -+ dev_info(ksdev, "0x%08x\n", jdesc[6]); -+ dev_info(ksdev, "0x%08x\n", jdesc[7]); -+#endif -+ -+ jstat = exec_test_job(ksdev, jdesc); -+ -+ dma_sync_single_for_cpu(ksdev, symint_dma, 256, DMA_FROM_DEVICE); -+ dma_unmap_single(ksdev, symint_dma, 256, DMA_FROM_DEVICE); -+ dma_unmap_single(ksdev, syminp_dma, 256, DMA_TO_DEVICE); -+ dma_unmap_single(ksdev, black_key_aes128_dma, 16, DMA_TO_DEVICE); -+ -+#ifdef SM_TEST_DETAIL -+ dev_info(ksdev, "input block:\n"); -+ dev_info(ksdev, "0x%02x 0x%02x 0x%02x 0x%02x " \ -+ "0x%02x 0x%02x 0x%02x 0x%02x\n", -+ syminp[0], syminp[1], syminp[2], syminp[3], -+ syminp[4], syminp[5], syminp[6], syminp[7]); -+ dev_info(ksdev, "0x%02x 0x%02x 0x%02x 0x%02x " \ -+ "0x%02x 0x%02x 0x%02x 0x%02x\n", -+ syminp[8], syminp[9], syminp[10], syminp[11], -+ syminp[12], syminp[13], syminp[14], syminp[15]); -+ dev_info(ksdev, "intermediate block:\n"); -+ dev_info(ksdev, "0x%02x 0x%02x 0x%02x 0x%02x " \ -+ "0x%02x 0x%02x 0x%02x 0x%02x\n", -+ symint[0], symint[1], symint[2], symint[3], -+ symint[4], symint[5], symint[6], symint[7]); -+ dev_info(ksdev, "0x%02x 0x%02x 0x%02x 0x%02x " \ -+ "0x%02x 0x%02x 0x%02x 0x%02x\n", -+ symint[8], symint[9], symint[10], symint[11], -+ symint[12], symint[13], symint[14], symint[15]); -+ dev_info(ksdev, "caam_sm_test: encrypt cycle with 16 byte key\n"); -+#endif -+ -+ /* AES-128 decrypt using 16 byte clear key */ -+ clear_key_aes128_dma = dma_map_single(ksdev, clear_key_aes128, 16, -+ DMA_TO_DEVICE); -+ 
dma_sync_single_for_device(ksdev, clear_key_aes128_dma, 16, -+ DMA_TO_DEVICE); -+ symint_dma = dma_map_single(ksdev, symint, 256, DMA_TO_DEVICE); -+ dma_sync_single_for_device(ksdev, symint_dma, 256, DMA_TO_DEVICE); -+ symout_dma = dma_map_single(ksdev, symout, 256, DMA_FROM_DEVICE); -+ -+ jdescsz = mk_job_desc(jdesc, clear_key_aes128_dma, 16, symint_dma, -+ symout_dma, 256, -+ OP_ALG_DECRYPT | OP_ALG_ALGSEL_AES, 0); -+ -+#ifdef SM_TEST_DETAIL -+ dev_info(ksdev, "jobdesc:\n"); -+ dev_info(ksdev, "0x%08x\n", jdesc[0]); -+ dev_info(ksdev, "0x%08x\n", jdesc[1]); -+ dev_info(ksdev, "0x%08x\n", jdesc[2]); -+ dev_info(ksdev, "0x%08x\n", jdesc[3]); -+ dev_info(ksdev, "0x%08x\n", jdesc[4]); -+ dev_info(ksdev, "0x%08x\n", jdesc[5]); -+ dev_info(ksdev, "0x%08x\n", jdesc[6]); -+ dev_info(ksdev, "0x%08x\n", jdesc[7]); -+#endif -+ jstat = exec_test_job(ksdev, jdesc); -+ -+ dma_sync_single_for_cpu(ksdev, symout_dma, 256, DMA_FROM_DEVICE); -+ dma_unmap_single(ksdev, symout_dma, 256, DMA_FROM_DEVICE); -+ dma_unmap_single(ksdev, symint_dma, 256, DMA_TO_DEVICE); -+ dma_unmap_single(ksdev, clear_key_aes128_dma, 16, DMA_TO_DEVICE); -+ -+#ifdef SM_TEST_DETAIL -+ dev_info(ksdev, "intermediate block:\n"); -+ dev_info(ksdev, "0x%02x 0x%02x 0x%02x 0x%02x " \ -+ "0x%02x 0x%02x 0x%02x 0x%02x\n", -+ symint[0], symint[1], symint[2], symint[3], -+ symint[4], symint[5], symint[6], symint[7]); -+ dev_info(ksdev, "0x%02x 0x%02x 0x%02x 0x%02x " \ -+ "0x%02x 0x%02x 0x%02x 0x%02x\n", -+ symint[8], symint[9], symint[10], symint[11], -+ symint[12], symint[13], symint[14], symint[15]); -+ dev_info(ksdev, "decrypted block:\n"); -+ dev_info(ksdev, "0x%02x 0x%02x 0x%02x 0x%02x " \ -+ "0x%02x 0x%02x 0x%02x 0x%02x\n", -+ symout[0], symout[1], symout[2], symout[3], -+ symout[4], symout[5], symout[6], symout[7]); -+ dev_info(ksdev, "0x%02x 0x%02x 0x%02x 0x%02x " \ -+ "0x%02x 0x%02x 0x%02x 0x%02x\n", -+ symout[8], symout[9], symout[10], symout[11], -+ symout[12], symout[13], symout[14], symout[15]); -+ dev_info(ksdev, "caam_sm_test: decrypt cycle with 16 byte key\n"); -+#endif -+ -+ /* Check result */ -+ if (memcmp(symout, syminp, 256)) { -+ dev_info(ksdev, "caam_sm_test: 16-byte key test mismatch\n"); -+ rtnval = -1; -+ goto freekeys; -+ } else -+ dev_info(ksdev, "caam_sm_test: 16-byte key test match OK\n"); -+ -+ /* AES-256 encrypt using 32 byte black key */ -+ black_key_aes256_dma = dma_map_single(ksdev, black_key_aes256, 32, -+ DMA_TO_DEVICE); -+ dma_sync_single_for_device(ksdev, black_key_aes256_dma, 32, -+ DMA_TO_DEVICE); -+ syminp_dma = dma_map_single(ksdev, syminp, 256, DMA_TO_DEVICE); -+ dma_sync_single_for_device(ksdev, syminp_dma, 256, DMA_TO_DEVICE); -+ symint_dma = dma_map_single(ksdev, symint, 256, DMA_FROM_DEVICE); -+ -+ jdescsz = mk_job_desc(jdesc, black_key_aes256_dma, 32, syminp_dma, -+ symint_dma, 256, -+ OP_ALG_ENCRYPT | OP_ALG_ALGSEL_AES, 0); -+ -+#ifdef SM_TEST_DETAIL -+ dev_info(ksdev, "jobdesc:\n"); -+ dev_info(ksdev, "0x%08x\n", jdesc[0]); -+ dev_info(ksdev, "0x%08x\n", jdesc[1]); -+ dev_info(ksdev, "0x%08x\n", jdesc[2]); -+ dev_info(ksdev, "0x%08x\n", jdesc[3]); -+ dev_info(ksdev, "0x%08x\n", jdesc[4]); -+ dev_info(ksdev, "0x%08x\n", jdesc[5]); -+ dev_info(ksdev, "0x%08x\n", jdesc[6]); -+ dev_info(ksdev, "0x%08x\n", jdesc[7]); -+#endif -+ -+ jstat = exec_test_job(ksdev, jdesc); -+ -+ dma_sync_single_for_cpu(ksdev, symint_dma, 256, DMA_FROM_DEVICE); -+ dma_unmap_single(ksdev, symint_dma, 256, DMA_FROM_DEVICE); -+ dma_unmap_single(ksdev, syminp_dma, 256, DMA_TO_DEVICE); -+ dma_unmap_single(ksdev, 
black_key_aes256_dma, 32, DMA_TO_DEVICE); -+ -+#ifdef SM_TEST_DETAIL -+ dev_info(ksdev, "input block:\n"); -+ dev_info(ksdev, "0x%02x 0x%02x 0x%02x 0x%02x " \ -+ "0x%02x 0x%02x 0x%02x 0x%02x\n", -+ syminp[0], syminp[1], syminp[2], syminp[3], -+ syminp[4], syminp[5], syminp[6], syminp[7]); -+ dev_info(ksdev, "0x%02x 0x%02x 0x%02x 0x%02x " \ -+ "0x%02x 0x%02x 0x%02x 0x%02x\n", -+ syminp[8], syminp[9], syminp[10], syminp[11], -+ syminp[12], syminp[13], syminp[14], syminp[15]); -+ dev_info(ksdev, "intermediate block:\n"); -+ dev_info(ksdev, "0x%02x 0x%02x 0x%02x 0x%02x " \ -+ "0x%02x 0x%02x 0x%02x 0x%02x\n", -+ symint[0], symint[1], symint[2], symint[3], -+ symint[4], symint[5], symint[6], symint[7]); -+ dev_info(ksdev, "0x%02x 0x%02x 0x%02x 0x%02x " \ -+ "0x%02x 0x%02x 0x%02x 0x%02x\n", -+ symint[8], symint[9], symint[10], symint[11], -+ symint[12], symint[13], symint[14], symint[15]); -+ dev_info(ksdev, "caam_sm_test: encrypt cycle with 32 byte key\n"); -+#endif -+ -+ /* AES-256 decrypt using 32-byte black key */ -+ clear_key_aes256_dma = dma_map_single(ksdev, clear_key_aes256, 32, -+ DMA_TO_DEVICE); -+ dma_sync_single_for_device(ksdev, clear_key_aes256_dma, 32, -+ DMA_TO_DEVICE); -+ symint_dma = dma_map_single(ksdev, symint, 256, DMA_TO_DEVICE); -+ dma_sync_single_for_device(ksdev, symint_dma, 256, DMA_TO_DEVICE); -+ symout_dma = dma_map_single(ksdev, symout, 256, DMA_FROM_DEVICE); -+ -+ jdescsz = mk_job_desc(jdesc, clear_key_aes256_dma, 32, symint_dma, -+ symout_dma, 256, -+ OP_ALG_DECRYPT | OP_ALG_ALGSEL_AES, 0); -+ -+#ifdef SM_TEST_DETAIL -+ dev_info(ksdev, "jobdesc:\n"); -+ dev_info(ksdev, "0x%08x\n", jdesc[0]); -+ dev_info(ksdev, "0x%08x\n", jdesc[1]); -+ dev_info(ksdev, "0x%08x\n", jdesc[2]); -+ dev_info(ksdev, "0x%08x\n", jdesc[3]); -+ dev_info(ksdev, "0x%08x\n", jdesc[4]); -+ dev_info(ksdev, "0x%08x\n", jdesc[5]); -+ dev_info(ksdev, "0x%08x\n", jdesc[6]); -+ dev_info(ksdev, "0x%08x\n", jdesc[7]); -+#endif -+ -+ jstat = exec_test_job(ksdev, jdesc); -+ -+ dma_sync_single_for_cpu(ksdev, symout_dma, 256, DMA_FROM_DEVICE); -+ dma_unmap_single(ksdev, symout_dma, 256, DMA_FROM_DEVICE); -+ dma_unmap_single(ksdev, symint_dma, 256, DMA_TO_DEVICE); -+ dma_unmap_single(ksdev, clear_key_aes256_dma, 32, DMA_TO_DEVICE); -+ -+#ifdef SM_TEST_DETAIL -+ dev_info(ksdev, "intermediate block:\n"); -+ dev_info(ksdev, "0x%02x 0x%02x 0x%02x 0x%02x " \ -+ "0x%02x 0x%02x 0x%02x 0x%02x\n", -+ symint[0], symint[1], symint[2], symint[3], -+ symint[4], symint[5], symint[6], symint[7]); -+ dev_info(ksdev, "0x%02x 0x%02x 0x%02x 0x%02x " \ -+ "0x%02x 0x%02x 0x%02x 0x%02x\n", -+ symint[8], symint[9], symint[10], symint[11], -+ symint[12], symint[13], symint[14], symint[15]); -+ dev_info(ksdev, "decrypted block:\n"); -+ dev_info(ksdev, "0x%02x 0x%02x 0x%02x 0x%02x " \ -+ "0x%02x 0x%02x 0x%02x 0x%02x\n", -+ symout[0], symout[1], symout[2], symout[3], -+ symout[4], symout[5], symout[6], symout[7]); -+ dev_info(ksdev, "0x%02x 0x%02x 0x%02x 0x%02x " \ -+ "0x%02x 0x%02x 0x%02x 0x%02x\n", -+ symout[8], symout[9], symout[10], symout[11], -+ symout[12], symout[13], symout[14], symout[15]); -+ dev_info(ksdev, "caam_sm_test: decrypt cycle with 32 byte key\n"); -+#endif -+ -+ /* Check result */ -+ if (memcmp(symout, syminp, 256)) { -+ dev_info(ksdev, "caam_sm_test: 32-byte key test mismatch\n"); -+ rtnval = -1; -+ goto freekeys; -+ } else -+ dev_info(ksdev, "caam_sm_test: 32-byte key test match OK\n"); -+ -+ -+ /* Remove 8/16/32 byte keys from keystore */ -+freekeys: -+ stat = sm_keystore_slot_dealloc(ksdev, unit, keyslot_des); 
-+ if (stat) -+ dev_info(ksdev, "caam_sm_test: can't release slot %d\n", -+ keyslot_des); -+ -+ stat = sm_keystore_slot_dealloc(ksdev, unit, keyslot_aes128); -+ if (stat) -+ dev_info(ksdev, "caam_sm_test: can't release slot %d\n", -+ keyslot_aes128); -+ -+ stat = sm_keystore_slot_dealloc(ksdev, unit, keyslot_aes256); -+ if (stat) -+ dev_info(ksdev, "caam_sm_test: can't release slot %d\n", -+ keyslot_aes256); -+ -+ -+ /* Free resources */ -+freemem: -+#ifdef SM_TEST_DETAIL -+ dev_info(ksdev, "caam_sm_test: cleaning up\n"); -+#endif -+ kfree(syminp); -+ kfree(symint); -+ kfree(symout); -+ kfree(clear_key_des); -+ kfree(clear_key_aes128); -+ kfree(clear_key_aes256); -+ kfree(black_key_des); -+ kfree(black_key_aes128); -+ kfree(black_key_aes256); -+ kfree(jdesc); -+ -+ /* Disconnect from keystore and leave */ -+ sm_release_keystore(ksdev, unit); -+ -+ return rtnval; -+} -+EXPORT_SYMBOL(caam_sm_example_init); -+ -+void caam_sm_example_shutdown(void) -+{ -+ /* unused in present version */ -+ struct device_node *dev_node; -+ struct platform_device *pdev; -+ -+ /* -+ * Do of_find_compatible_node() then of_find_device_by_node() -+ * once a functional device tree is available -+ */ -+ dev_node = of_find_compatible_node(NULL, NULL, "fsl,sec-v4.0"); -+ if (!dev_node) { -+ dev_node = of_find_compatible_node(NULL, NULL, "fsl,sec4.0"); -+ if (!dev_node) -+ return; -+ } -+ -+ pdev = of_find_device_by_node(dev_node); -+ if (!pdev) -+ return; -+ -+ of_node_get(dev_node); -+ -+} -+ -+static int __init caam_sm_test_init(void) -+{ -+ struct device_node *dev_node; -+ struct platform_device *pdev; -+ -+ /* -+ * Do of_find_compatible_node() then of_find_device_by_node() -+ * once a functional device tree is available -+ */ -+ dev_node = of_find_compatible_node(NULL, NULL, "fsl,sec-v4.0"); -+ if (!dev_node) { -+ dev_node = of_find_compatible_node(NULL, NULL, "fsl,sec4.0"); -+ if (!dev_node) -+ return -ENODEV; -+ } -+ -+ pdev = of_find_device_by_node(dev_node); -+ if (!pdev) -+ return -ENODEV; -+ -+ of_node_put(dev_node); -+ -+ caam_sm_example_init(pdev); -+ -+ return 0; -+} -+ -+ -+/* Module-based initialization needs to wait for dev tree */ -+#ifdef CONFIG_OF -+module_init(caam_sm_test_init); -+module_exit(caam_sm_example_shutdown); -+ -+MODULE_LICENSE("Dual BSD/GPL"); -+MODULE_DESCRIPTION("FSL CAAM Keystore Usage Example"); -+MODULE_AUTHOR("Freescale Semiconductor - NMSG/MAD"); -+#endif -diff -Nur linux-4.1.3/drivers/crypto/caam/snvsregs.h linux-xbian-imx6/drivers/crypto/caam/snvsregs.h ---- linux-4.1.3/drivers/crypto/caam/snvsregs.h 1970-01-01 01:00:00.000000000 +0100 -+++ linux-xbian-imx6/drivers/crypto/caam/snvsregs.h 2015-07-27 23:13:04.213947410 +0200 -@@ -0,0 +1,237 @@ -+/* -+ * SNVS hardware register-level view -+ * -+ * Copyright (C) 2012-2014 Freescale Semiconductor, Inc., All Rights Reserved -+ */ -+ -+#ifndef SNVSREGS_H -+#define SNVSREGS_H -+ -+#include -+#include -+ -+/* -+ * SNVS High Power Domain -+ * Includes security violations, HA counter, RTC, alarm -+ */ -+struct snvs_hp { -+ u32 lock; /* HPLR - HP Lock */ -+ u32 cmd; /* HPCOMR - HP Command */ -+ u32 ctl; /* HPCR - HP Control */ -+ u32 secvio_intcfg; /* HPSICR - Security Violation Int Config */ -+ u32 secvio_ctl; /* HPSVCR - Security Violation Control */ -+ u32 status; /* HPSR - HP Status */ -+ u32 secvio_status; /* HPSVSR - Security Violation Status */ -+ u32 ha_counteriv; /* High Assurance Counter IV */ -+ u32 ha_counter; /* High Assurance Counter */ -+ u32 rtc_msb; /* Real Time Clock/Counter MSB */ -+ u32 rtc_lsb; /* Real Time Counter LSB 
*/ -+ u32 time_alarm_msb; /* Time Alarm MSB */ -+ u32 time_alarm_lsb; /* Time Alarm LSB */ -+}; -+ -+#define HP_LOCK_HAC_LCK 0x00040000 -+#define HP_LOCK_HPSICR_LCK 0x00020000 -+#define HP_LOCK_HPSVCR_LCK 0x00010000 -+#define HP_LOCK_MKEYSEL_LCK 0x00000200 -+#define HP_LOCK_TAMPCFG_LCK 0x00000100 -+#define HP_LOCK_TAMPFLT_LCK 0x00000080 -+#define HP_LOCK_SECVIO_LCK 0x00000040 -+#define HP_LOCK_GENP_LCK 0x00000020 -+#define HP_LOCK_MONOCTR_LCK 0x00000010 -+#define HP_LOCK_CALIB_LCK 0x00000008 -+#define HP_LOCK_SRTC_LCK 0x00000004 -+#define HP_LOCK_ZMK_RD_LCK 0x00000002 -+#define HP_LOCK_ZMK_WT_LCK 0x00000001 -+ -+#define HP_CMD_NONPRIV_AXS 0x80000000 -+#define HP_CMD_HAC_STOP 0x00080000 -+#define HP_CMD_HAC_CLEAR 0x00040000 -+#define HP_CMD_HAC_LOAD 0x00020000 -+#define HP_CMD_HAC_CFG_EN 0x00010000 -+#define HP_CMD_SNVS_MSTR_KEY 0x00002000 -+#define HP_CMD_PROG_ZMK 0x00001000 -+#define HP_CMD_SW_LPSV 0x00000400 -+#define HP_CMD_SW_FSV 0x00000200 -+#define HP_CMD_SW_SV 0x00000100 -+#define HP_CMD_LP_SWR_DIS 0x00000020 -+#define HP_CMD_LP_SWR 0x00000010 -+#define HP_CMD_SSM_SFNS_DIS 0x00000004 -+#define HP_CMD_SSM_ST_DIS 0x00000002 -+#define HP_CMD_SMM_ST 0x00000001 -+ -+#define HP_CTL_TIME_SYNC 0x00010000 -+#define HP_CTL_CAL_VAL_SHIFT 10 -+#define HP_CTL_CAL_VAL_MASK (0x1f << HP_CTL_CALIB_SHIFT) -+#define HP_CTL_CALIB_EN 0x00000100 -+#define HP_CTL_PI_FREQ_SHIFT 4 -+#define HP_CTL_PI_FREQ_MASK (0xf << HP_CTL_PI_FREQ_SHIFT) -+#define HP_CTL_PI_EN 0x00000008 -+#define HP_CTL_TIMEALARM_EN 0x00000002 -+#define HP_CTL_RTC_EN 0x00000001 -+ -+#define HP_SECVIO_INTEN_EN 0x10000000 -+#define HP_SECVIO_INTEN_SRC5 0x00000020 -+#define HP_SECVIO_INTEN_SRC4 0x00000010 -+#define HP_SECVIO_INTEN_SRC3 0x00000008 -+#define HP_SECVIO_INTEN_SRC2 0x00000004 -+#define HP_SECVIO_INTEN_SRC1 0x00000002 -+#define HP_SECVIO_INTEN_SRC0 0x00000001 -+#define HP_SECVIO_INTEN_ALL 0x8000003f -+ -+#define HP_SECVIO_ICTL_CFG_SHIFT 30 -+#define HP_SECVIO_ICTL_CFG_MASK (0x3 << HP_SECVIO_ICTL_CFG_SHIFT) -+#define HP_SECVIO_ICTL_CFG5_SHIFT 5 -+#define HP_SECVIO_ICTL_CFG5_MASK (0x3 << HP_SECVIO_ICTL_CFG5_SHIFT) -+#define HP_SECVIO_ICTL_CFG_DISABLE 0 -+#define HP_SECVIO_ICTL_CFG_NONFATAL 1 -+#define HP_SECVIO_ICTL_CFG_FATAL 2 -+#define HP_SECVIO_ICTL_CFG4_FATAL 0x00000010 -+#define HP_SECVIO_ICTL_CFG3_FATAL 0x00000008 -+#define HP_SECVIO_ICTL_CFG2_FATAL 0x00000004 -+#define HP_SECVIO_ICTL_CFG1_FATAL 0x00000002 -+#define HP_SECVIO_ICTL_CFG0_FATAL 0x00000001 -+ -+#define HP_STATUS_ZMK_ZERO 0x80000000 -+#define HP_STATUS_OTPMK_ZERO 0x08000000 -+#define HP_STATUS_OTPMK_SYN_SHIFT 16 -+#define HP_STATUS_OTPMK_SYN_MASK (0x1ff << HP_STATUS_OTPMK_SYN_SHIFT) -+#define HP_STATUS_SSM_ST_SHIFT 8 -+#define HP_STATUS_SSM_ST_MASK (0xf << HP_STATUS_SSM_ST_SHIFT) -+#define HP_STATUS_SSM_ST_INIT 0 -+#define HP_STATUS_SSM_ST_HARDFAIL 1 -+#define HP_STATUS_SSM_ST_SOFTFAIL 3 -+#define HP_STATUS_SSM_ST_INITINT 8 -+#define HP_STATUS_SSM_ST_CHECK 9 -+#define HP_STATUS_SSM_ST_NONSECURE 11 -+#define HP_STATUS_SSM_ST_TRUSTED 13 -+#define HP_STATUS_SSM_ST_SECURE 15 -+ -+#define HP_SECVIOST_ZMK_ECC_FAIL 0x08000000 /* write to clear */ -+#define HP_SECVIOST_ZMK_SYN_SHIFT 16 -+#define HP_SECVIOST_ZMK_SYN_MASK (0x1ff << HP_SECVIOST_ZMK_SYN_SHIFT) -+#define HP_SECVIOST_SECVIO5 0x00000020 -+#define HP_SECVIOST_SECVIO4 0x00000010 -+#define HP_SECVIOST_SECVIO3 0x00000008 -+#define HP_SECVIOST_SECVIO2 0x00000004 -+#define HP_SECVIOST_SECVIO1 0x00000002 -+#define HP_SECVIOST_SECVIO0 0x00000001 -+#define HP_SECVIOST_SECVIOMASK 0x0000003f -+ -+/* -+ * SNVS Low Power 
Domain -+ * Includes glitch detector, SRTC, alarm, monotonic counter, ZMK -+ */ -+struct snvs_lp { -+ u32 lock; -+ u32 ctl; -+ u32 mstr_key_ctl; /* Master Key Control */ -+ u32 secvio_ctl; /* Security Violation Control */ -+ u32 tamper_filt_cfg; /* Tamper Glitch Filters Configuration */ -+ u32 tamper_det_cfg; /* Tamper Detectors Configuration */ -+ u32 status; -+ u32 srtc_msb; /* Secure Real Time Clock/Counter MSB */ -+ u32 srtc_lsb; /* Secure Real Time Clock/Counter LSB */ -+ u32 time_alarm; /* Time Alarm */ -+ u32 smc_msb; /* Secure Monotonic Counter MSB */ -+ u32 smc_lsb; /* Secure Monotonic Counter LSB */ -+ u32 pwr_glitch_det; /* Power Glitch Detector */ -+ u32 gen_purpose; -+ u32 zmk[8]; /* Zeroizable Master Key */ -+}; -+ -+#define LP_LOCK_MKEYSEL_LCK 0x00000200 -+#define LP_LOCK_TAMPDET_LCK 0x00000100 -+#define LP_LOCK_TAMPFLT_LCK 0x00000080 -+#define LP_LOCK_SECVIO_LCK 0x00000040 -+#define LP_LOCK_GENP_LCK 0x00000020 -+#define LP_LOCK_MONOCTR_LCK 0x00000010 -+#define LP_LOCK_CALIB_LCK 0x00000008 -+#define LP_LOCK_SRTC_LCK 0x00000004 -+#define LP_LOCK_ZMK_RD_LCK 0x00000002 -+#define LP_LOCK_ZMK_WT_LCK 0x00000001 -+ -+#define LP_CTL_CAL_VAL_SHIFT 10 -+#define LP_CTL_CAL_VAL_MASK (0x1f << LP_CTL_CAL_VAL_SHIFT) -+#define LP_CTL_CALIB_EN 0x00000100 -+#define LP_CTL_SRTC_INVAL_EN 0x00000010 -+#define LP_CTL_WAKE_INT_EN 0x00000008 -+#define LP_CTL_MONOCTR_EN 0x00000004 -+#define LP_CTL_TIMEALARM_EN 0x00000002 -+#define LP_CTL_SRTC_EN 0x00000001 -+ -+#define LP_MKEYCTL_ZMKECC_SHIFT 8 -+#define LP_MKEYCTL_ZMKECC_MASK (0xff << LP_MKEYCTL_ZMKECC_SHIFT) -+#define LP_MKEYCTL_ZMKECC_EN 0x00000010 -+#define LP_MKEYCTL_ZMKECC_VAL 0x00000008 -+#define LP_MKEYCTL_ZMKECC_PROG 0x00000004 -+#define LP_MKEYCTL_MKSEL_SHIFT 0 -+#define LP_MKEYCTL_MKSEL_MASK (3 << LP_MKEYCTL_MKSEL_SHIFT) -+#define LP_MKEYCTL_MK_OTP 0 -+#define LP_MKEYCTL_MK_ZMK 2 -+#define LP_MKEYCTL_MK_COMB 3 -+ -+#define LP_SECVIO_CTL_SRC5 0x20 -+#define LP_SECVIO_CTL_SRC4 0x10 -+#define LP_SECVIO_CTL_SRC3 0x08 -+#define LP_SECVIO_CTL_SRC2 0x04 -+#define LP_SECVIO_CTL_SRC1 0x02 -+#define LP_SECVIO_CTL_SRC0 0x01 -+ -+#define LP_TAMPFILT_EXT2_EN 0x80000000 -+#define LP_TAMPFILT_EXT2_SHIFT 24 -+#define LP_TAMPFILT_EXT2_MASK (0x1f << LP_TAMPFILT_EXT2_SHIFT) -+#define LP_TAMPFILT_EXT1_EN 0x00800000 -+#define LP_TAMPFILT_EXT1_SHIFT 16 -+#define LP_TAMPFILT_EXT1_MASK (0x1f << LP_TAMPFILT_EXT1_SHIFT) -+#define LP_TAMPFILT_WM_EN 0x00000080 -+#define LP_TAMPFILT_WM_SHIFT 0 -+#define LP_TAMPFILT_WM_MASK (0x1f << LP_TAMPFILT_WM_SHIFT) -+ -+#define LP_TAMPDET_OSC_BPS 0x10000000 -+#define LP_TAMPDET_VRC_SHIFT 24 -+#define LP_TAMPDET_VRC_MASK (3 << LP_TAMPFILT_VRC_SHIFT) -+#define LP_TAMPDET_HTDC_SHIFT 20 -+#define LP_TAMPDET_HTDC_MASK (3 << LP_TAMPFILT_HTDC_SHIFT) -+#define LP_TAMPDET_LTDC_SHIFT 16 -+#define LP_TAMPDET_LTDC_MASK (3 << LP_TAMPFILT_LTDC_SHIFT) -+#define LP_TAMPDET_POR_OBS 0x00008000 -+#define LP_TAMPDET_PFD_OBS 0x00004000 -+#define LP_TAMPDET_ET2_EN 0x00000400 -+#define LP_TAMPDET_ET1_EN 0x00000200 -+#define LP_TAMPDET_WMT2_EN 0x00000100 -+#define LP_TAMPDET_WMT1_EN 0x00000080 -+#define LP_TAMPDET_VT_EN 0x00000040 -+#define LP_TAMPDET_TT_EN 0x00000020 -+#define LP_TAMPDET_CT_EN 0x00000010 -+#define LP_TAMPDET_MCR_EN 0x00000004 -+#define LP_TAMPDET_SRTCR_EN 0x00000002 -+ -+#define LP_STATUS_SECURE -+#define LP_STATUS_NONSECURE -+#define LP_STATUS_SCANEXIT 0x00100000 /* all write 1 clear here on */ -+#define LP_STATUS_EXT_SECVIO 0x00010000 -+#define LP_STATUS_ET2 0x00000400 -+#define LP_STATUS_ET1 0x00000200 -+#define LP_STATUS_WMT2 
0x00000100 -+#define LP_STATUS_WMT1 0x00000080 -+#define LP_STATUS_VTD 0x00000040 -+#define LP_STATUS_TTD 0x00000020 -+#define LP_STATUS_CTD 0x00000010 -+#define LP_STATUS_PGD 0x00000008 -+#define LP_STATUS_MCR 0x00000004 -+#define LP_STATUS_SRTCR 0x00000002 -+#define LP_STATUS_LPTA 0x00000001 -+ -+/* Full SNVS register page, including version/options */ -+struct snvs_full { -+ struct snvs_hp hp; -+ struct snvs_lp lp; -+ u32 rsvd[731]; /* deadspace 0x08c-0xbf7 */ -+ -+ /* Version / Revision / Option ID space - end of register page */ -+ u32 vid; /* 0xbf8 HP Version ID (VID 1) */ -+ u32 opt_rev; /* 0xbfc HP Options / Revision (VID 2) */ -+}; -+ -+#endif /* SNVSREGS_H */ -diff -Nur linux-4.1.3/drivers/dma/imx-sdma.c linux-xbian-imx6/drivers/dma/imx-sdma.c ---- linux-4.1.3/drivers/dma/imx-sdma.c 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/drivers/dma/imx-sdma.c 2015-07-27 23:13:04.285691435 +0200 -@@ -29,6 +29,7 @@ - #include - #include - #include -+#include - #include - #include - #include -@@ -232,6 +233,14 @@ - - struct sdma_engine; - -+enum sdma_mode { -+ SDMA_MODE_INVALID = 0, -+ SDMA_MODE_LOOP, -+ SDMA_MODE_NORMAL, -+ SDMA_MODE_P2P, -+ SDMA_MODE_NO_BD, -+}; -+ - /** - * struct sdma_channel - housekeeping for a SDMA channel - * -@@ -244,6 +253,7 @@ - * @word_size peripheral access size - * @buf_tail ID of the buffer that was processed - * @num_bd max NUM_BD. number of descriptors currently handling -+ * @bd_iram flag indicating the memory location of buffer descriptor - */ - struct sdma_channel { - struct sdma_engine *sdma; -@@ -258,12 +268,16 @@ - unsigned int period_len; - struct sdma_buffer_descriptor *bd; - dma_addr_t bd_phys; -+ bool bd_iram; - unsigned int pc_from_device, pc_to_device; -- unsigned long flags; -- dma_addr_t per_address; -+ unsigned int device_to_device; -+ unsigned int other_script; -+ enum sdma_mode mode; -+ dma_addr_t per_address, per_address2; - unsigned long event_mask[2]; - unsigned long watermark_level; - u32 shp_addr, per_addr; -+ u32 data_addr1, data_addr2; - struct dma_chan chan; - spinlock_t lock; - struct dma_async_tx_descriptor desc; -@@ -271,11 +285,8 @@ - unsigned int chn_count; - unsigned int chn_real_count; - struct tasklet_struct tasklet; -- struct imx_dma_data data; - }; - --#define IMX_DMA_SG_LOOP BIT(0) -- - #define MAX_DMA_CHANNELS 32 - #define MXC_SDMA_DEFAULT_PRIORITY 1 - #define MXC_SDMA_MIN_PRIORITY 1 -@@ -327,6 +338,7 @@ - spinlock_t channel_0_lock; - u32 script_number; - struct sdma_script_start_addrs *script_addrs; -+ struct gen_pool *iram_pool; - const struct sdma_driver_data *drvdata; - }; - -@@ -546,12 +558,14 @@ - dma_addr_t buf_phys; - int ret; - unsigned long flags; -+ bool use_iram = true; - -- buf_virt = dma_alloc_coherent(NULL, -- size, -- &buf_phys, GFP_KERNEL); -+ buf_virt = gen_pool_dma_alloc(sdma->iram_pool, size, &buf_phys); - if (!buf_virt) { -- return -ENOMEM; -+ use_iram = false; -+ buf_virt = dma_alloc_coherent(NULL, size, &buf_phys, GFP_KERNEL); -+ if (!buf_virt) -+ return -ENOMEM; - } - - spin_lock_irqsave(&sdma->channel_0_lock, flags); -@@ -568,7 +582,10 @@ - - spin_unlock_irqrestore(&sdma->channel_0_lock, flags); - -- dma_free_coherent(NULL, size, buf_virt, buf_phys); -+ if (use_iram) -+ gen_pool_free(sdma->iram_pool, (unsigned long)buf_virt, size); -+ else -+ dma_free_coherent(NULL, size, buf_virt, buf_phys); - - return ret; - } -@@ -654,14 +671,31 @@ - sdmac->desc.callback(sdmac->desc.callback_param); - } - -+static void sdma_handle_other_intr(struct sdma_channel *sdmac) -+{ -+ if 
(sdmac->desc.callback) -+ sdmac->desc.callback(sdmac->desc.callback_param); -+} -+ - static void sdma_tasklet(unsigned long data) - { - struct sdma_channel *sdmac = (struct sdma_channel *) data; -+ struct sdma_engine *sdma = sdmac->sdma; - -- if (sdmac->flags & IMX_DMA_SG_LOOP) -+ switch (sdmac->mode) { -+ case SDMA_MODE_LOOP: - sdma_handle_channel_loop(sdmac); -- else -+ break; -+ case SDMA_MODE_NORMAL: - mxc_sdma_handle_channel_normal(sdmac); -+ break; -+ case SDMA_MODE_NO_BD: -+ sdma_handle_other_intr(sdmac); -+ break; -+ default: -+ dev_err(sdma->dev, "invalid SDMA MODE!\n"); -+ break; -+ } - } - - static irqreturn_t sdma_int_handler(int irq, void *dev_id) -@@ -678,7 +712,7 @@ - int channel = fls(stat) - 1; - struct sdma_channel *sdmac = &sdma->channel[channel]; - -- if (sdmac->flags & IMX_DMA_SG_LOOP) -+ if (sdmac->mode & SDMA_MODE_LOOP) - sdma_update_channel_loop(sdmac); - - tasklet_schedule(&sdmac->tasklet); -@@ -702,9 +736,12 @@ - * two peripherals or memory-to-memory transfers - */ - int per_2_per = 0, emi_2_emi = 0; -+ int other = 0; - - sdmac->pc_from_device = 0; - sdmac->pc_to_device = 0; -+ sdmac->device_to_device = 0; -+ sdmac->other_script = 0; - - switch (peripheral_type) { - case IMX_DMATYPE_MEMORY: -@@ -733,7 +770,6 @@ - case IMX_DMATYPE_CSPI: - case IMX_DMATYPE_EXT: - case IMX_DMATYPE_SSI: -- case IMX_DMATYPE_SAI: - per_2_emi = sdma->script_addrs->app_2_mcu_addr; - emi_2_per = sdma->script_addrs->mcu_2_app_addr; - break; -@@ -751,11 +787,6 @@ - emi_2_per = sdma->script_addrs->mcu_2_shp_addr; - break; - case IMX_DMATYPE_ASRC: -- per_2_emi = sdma->script_addrs->asrc_2_mcu_addr; -- emi_2_per = sdma->script_addrs->asrc_2_mcu_addr; -- per_2_per = sdma->script_addrs->per_2_per_addr; -- break; -- case IMX_DMATYPE_ASRC_SP: - per_2_emi = sdma->script_addrs->shp_2_mcu_addr; - emi_2_per = sdma->script_addrs->mcu_2_shp_addr; - per_2_per = sdma->script_addrs->per_2_per_addr; -@@ -774,12 +805,17 @@ - case IMX_DMATYPE_IPU_MEMORY: - emi_2_per = sdma->script_addrs->ext_mem_2_ipu_addr; - break; -+ case IMX_DMATYPE_HDMI: -+ other = sdma->script_addrs->hdmi_dma_addr; -+ break; - default: - break; - } - - sdmac->pc_from_device = per_2_emi; - sdmac->pc_to_device = emi_2_per; -+ sdmac->device_to_device = per_2_per; -+ sdmac->other_script = other; - } - - static int sdma_load_context(struct sdma_channel *sdmac) -@@ -792,11 +828,14 @@ - int ret; - unsigned long flags; - -- if (sdmac->direction == DMA_DEV_TO_MEM) { -+ if (sdmac->direction == DMA_DEV_TO_MEM) - load_address = sdmac->pc_from_device; -- } else { -+ else if (sdmac->direction == DMA_DEV_TO_DEV) -+ load_address = sdmac->device_to_device; -+ else if (sdmac->direction == DMA_MEM_TO_DEV) - load_address = sdmac->pc_to_device; -- } -+ else -+ load_address = sdmac->other_script; - - if (load_address < 0) - return load_address; -@@ -816,11 +855,16 @@ - /* Send by context the event mask,base address for peripheral - * and watermark level - */ -- context->gReg[0] = sdmac->event_mask[1]; -- context->gReg[1] = sdmac->event_mask[0]; -- context->gReg[2] = sdmac->per_addr; -- context->gReg[6] = sdmac->shp_addr; -- context->gReg[7] = sdmac->watermark_level; -+ if (sdmac->peripheral_type == IMX_DMATYPE_HDMI) { -+ context->gReg[4] = sdmac->data_addr1; -+ context->gReg[6] = sdmac->data_addr2; -+ } else { -+ context->gReg[0] = sdmac->event_mask[1]; -+ context->gReg[1] = sdmac->event_mask[0]; -+ context->gReg[2] = sdmac->per_addr; -+ context->gReg[6] = sdmac->shp_addr; -+ context->gReg[7] = sdmac->watermark_level; -+ } - - bd0->mode.command = C0_SETDM; - 
bd0->mode.status = BD_DONE | BD_INTR | BD_WRAP | BD_EXTD; -@@ -854,6 +898,7 @@ - static int sdma_config_channel(struct dma_chan *chan) - { - struct sdma_channel *sdmac = to_sdma_chan(chan); -+ struct imx_dma_data *data = sdmac->chan.private; - int ret; - - sdma_disable_channel(chan); -@@ -862,12 +907,19 @@ - sdmac->event_mask[1] = 0; - sdmac->shp_addr = 0; - sdmac->per_addr = 0; -+ sdmac->data_addr1 = 0; -+ sdmac->data_addr2 = 0; - -- if (sdmac->event_id0) { -+ if (sdmac->event_id0 >= 0) { - if (sdmac->event_id0 >= sdmac->sdma->drvdata->num_events) - return -EINVAL; - sdma_event_enable(sdmac, sdmac->event_id0); - } -+ if (sdmac->event_id1) { -+ if (sdmac->event_id1 >= sdmac->sdma->drvdata->num_events) -+ return -EINVAL; -+ sdma_event_enable(sdmac, sdmac->event_id1); -+ } - - switch (sdmac->peripheral_type) { - case IMX_DMATYPE_DSP: -@@ -887,19 +939,75 @@ - (sdmac->peripheral_type != IMX_DMATYPE_DSP)) { - /* Handle multiple event channels differently */ - if (sdmac->event_id1) { -- sdmac->event_mask[1] = BIT(sdmac->event_id1 % 32); -- if (sdmac->event_id1 > 31) -- __set_bit(31, &sdmac->watermark_level); -- sdmac->event_mask[0] = BIT(sdmac->event_id0 % 32); -- if (sdmac->event_id0 > 31) -- __set_bit(30, &sdmac->watermark_level); -+ if (sdmac->event_id0 > 31) { -+ sdmac->event_mask[0] |= 0; -+ __set_bit(28, &sdmac->watermark_level); -+ sdmac->event_mask[1] |= -+ BIT(sdmac->event_id0 % 32); -+ } else { -+ sdmac->event_mask[1] |= 0; -+ sdmac->event_mask[0] |= -+ BIT(sdmac->event_id0 % 32); -+ } -+ if (sdmac->event_id1 > 31) { -+ sdmac->event_mask[0] |= 0; -+ __set_bit(29, &sdmac->watermark_level); -+ sdmac->event_mask[1] |= -+ BIT(sdmac->event_id1 % 32); -+ } else { -+ sdmac->event_mask[1] |= 0; -+ sdmac->event_mask[0] |= -+ BIT(sdmac->event_id1 % 32); -+ } -+ /* BIT 11: -+ * 1 : Source on SPBA -+ * 0 : Source on AIPS -+ */ -+ __set_bit(11, &sdmac->watermark_level); -+ /* BIT 12: -+ * 1 : Destination on SPBA -+ * 0 : Destination on AIPS -+ */ -+ __set_bit(12, &sdmac->watermark_level); -+ __set_bit(31, &sdmac->watermark_level); -+ /* BIT 31: -+ * 1 : Amount of samples to be transferred is -+ * unknown and script will keep on transferring -+ * samples as long as both events are detected -+ * and script must be manually stopped by the -+ * application. 
-+ * 0 : The amount of samples to be is equal to -+ * the count field of mode word -+ * */ -+ __set_bit(25, &sdmac->watermark_level); -+ __clear_bit(24, &sdmac->watermark_level); - } else { -- __set_bit(sdmac->event_id0, sdmac->event_mask); -+ if (sdmac->event_id0 > 31) { -+ sdmac->event_mask[0] = 0; -+ sdmac->event_mask[1] |= -+ BIT(sdmac->event_id0 % 32); -+ } else { -+ sdmac->event_mask[0] |= -+ BIT(sdmac->event_id0 % 32); -+ sdmac->event_mask[1] = 0; -+ } - } - /* Watermark Level */ - sdmac->watermark_level |= sdmac->watermark_level; - /* Address */ -- sdmac->shp_addr = sdmac->per_address; -+ if (sdmac->direction == DMA_DEV_TO_DEV) { -+ sdmac->shp_addr = sdmac->per_address2; -+ sdmac->per_addr = sdmac->per_address; -+ } else if (sdmac->direction == DMA_TRANS_NONE) { -+ if (sdmac->peripheral_type != IMX_DMATYPE_HDMI || -+ !data->data_addr1 || !data->data_addr2) -+ return -EINVAL; -+ sdmac->data_addr1 = *(u32 *)data->data_addr1; -+ sdmac->data_addr2 = *(u32 *)data->data_addr2; -+ sdmac->watermark_level = 0; -+ } else { -+ sdmac->shp_addr = sdmac->per_address; -+ } - } else { - sdmac->watermark_level = 0; /* FIXME: M3_BASE_ADDRESS */ - } -@@ -931,13 +1039,19 @@ - int channel = sdmac->channel; - int ret = -EBUSY; - -- sdmac->bd = dma_zalloc_coherent(NULL, PAGE_SIZE, &sdmac->bd_phys, -- GFP_KERNEL); -+ sdmac->bd_iram = true; -+ sdmac->bd = gen_pool_dma_alloc(sdma->iram_pool, PAGE_SIZE, &sdmac->bd_phys); - if (!sdmac->bd) { -- ret = -ENOMEM; -- goto out; -+ sdmac->bd_iram = false; -+ sdmac->bd = dma_alloc_coherent(NULL, PAGE_SIZE, &sdmac->bd_phys, GFP_KERNEL); -+ if (!sdmac->bd) { -+ ret = -ENOMEM; -+ goto out; -+ } - } - -+ memset(sdmac->bd, 0, PAGE_SIZE); -+ - sdma->channel_control[channel].base_bd_ptr = sdmac->bd_phys; - sdma->channel_control[channel].current_bd_ptr = sdmac->bd_phys; - -@@ -987,6 +1101,7 @@ - - sdmac->peripheral_type = data->peripheral_type; - sdmac->event_id0 = data->dma_request; -+ sdmac->event_id1 = data->dma_request2; - - clk_enable(sdmac->sdma->clk_ipg); - clk_enable(sdmac->sdma->clk_ahb); -@@ -1004,6 +1119,9 @@ - /* txd.flags will be overwritten in prep funcs */ - sdmac->desc.flags = DMA_CTRL_ACK; - -+ /* Set SDMA channel mode to unvalid to avoid misconfig */ -+ sdmac->mode = SDMA_MODE_INVALID; -+ - return 0; - } - -@@ -1014,7 +1132,7 @@ - - sdma_disable_channel(chan); - -- if (sdmac->event_id0) -+ if (sdmac->event_id0 >= 0) - sdma_event_disable(sdmac, sdmac->event_id0); - if (sdmac->event_id1) - sdma_event_disable(sdmac, sdmac->event_id1); -@@ -1024,7 +1142,10 @@ - - sdma_set_channel_priority(sdmac, 0); - -- dma_free_coherent(NULL, PAGE_SIZE, sdmac->bd, sdmac->bd_phys); -+ if (sdmac->bd_iram) -+ gen_pool_free(sdma->iram_pool, (unsigned long)sdmac->bd, PAGE_SIZE); -+ else -+ dma_free_coherent(NULL, PAGE_SIZE, sdmac->bd, sdmac->bd_phys); - - clk_disable(sdma->clk_ipg); - clk_disable(sdma->clk_ahb); -@@ -1045,7 +1166,7 @@ - return NULL; - sdmac->status = DMA_IN_PROGRESS; - -- sdmac->flags = 0; -+ sdmac->mode = SDMA_MODE_NORMAL; - - sdmac->buf_tail = 0; - -@@ -1134,13 +1255,13 @@ - static struct dma_async_tx_descriptor *sdma_prep_dma_cyclic( - struct dma_chan *chan, dma_addr_t dma_addr, size_t buf_len, - size_t period_len, enum dma_transfer_direction direction, -- unsigned long flags) -+ unsigned long flags, void *context) - { - struct sdma_channel *sdmac = to_sdma_chan(chan); - struct sdma_engine *sdma = sdmac->sdma; -- int num_periods = buf_len / period_len; - int channel = sdmac->channel; - int ret, i = 0, buf = 0; -+ int num_periods; - - dev_dbg(sdma->dev, "%s 
channel: %d\n", __func__, channel); - -@@ -1152,12 +1273,33 @@ - sdmac->buf_tail = 0; - sdmac->period_len = period_len; - -- sdmac->flags |= IMX_DMA_SG_LOOP; - sdmac->direction = direction; -+ -+ switch (sdmac->direction) { -+ case DMA_DEV_TO_DEV: -+ sdmac->mode = SDMA_MODE_P2P; -+ break; -+ case DMA_TRANS_NONE: -+ sdmac->mode = SDMA_MODE_NO_BD; -+ break; -+ case DMA_MEM_TO_DEV: -+ case DMA_DEV_TO_MEM: -+ sdmac->mode = SDMA_MODE_LOOP; -+ break; -+ default: -+ dev_err(sdma->dev, "invalid SDMA direction %d\n", direction); -+ return NULL; -+ } -+ - ret = sdma_load_context(sdmac); - if (ret) - goto err_out; - -+ if (period_len) -+ num_periods = buf_len / period_len; -+ else -+ return &sdmac->desc; -+ - if (num_periods > NUM_BD) { - dev_err(sdma->dev, "SDMA channel %d: maximum number of sg exceeded: %d > %d\n", - channel, num_periods, NUM_BD); -@@ -1216,7 +1358,16 @@ - { - struct sdma_channel *sdmac = to_sdma_chan(chan); - -- if (dmaengine_cfg->direction == DMA_DEV_TO_MEM) { -+ if (dmaengine_cfg->direction == DMA_DEV_TO_DEV) { -+ sdmac->per_address = dmaengine_cfg->src_addr; -+ sdmac->per_address2 = dmaengine_cfg->dst_addr; -+ sdmac->watermark_level = 0; -+ sdmac->watermark_level |= -+ dmaengine_cfg->src_maxburst; -+ sdmac->watermark_level |= -+ dmaengine_cfg->dst_maxburst << 16; -+ sdmac->word_size = dmaengine_cfg->dst_addr_width; -+ } else if (dmaengine_cfg->direction == DMA_DEV_TO_MEM) { - sdmac->per_address = dmaengine_cfg->src_addr; - sdmac->watermark_level = dmaengine_cfg->src_maxburst * - dmaengine_cfg->src_addr_width; -@@ -1238,7 +1389,7 @@ - struct sdma_channel *sdmac = to_sdma_chan(chan); - u32 residue; - -- if (sdmac->flags & IMX_DMA_SG_LOOP) -+ if (sdmac->mode & SDMA_MODE_LOOP) - residue = (sdmac->num_bd - sdmac->buf_tail) * sdmac->period_len; - else - residue = sdmac->chn_count - sdmac->chn_real_count; -@@ -1286,8 +1437,7 @@ - unsigned short *ram_code; - - if (!fw) { -- dev_info(sdma->dev, "external firmware not found, using ROM firmware\n"); -- /* In this case we just use the ROM firmware. 
*/ -+ dev_err(sdma->dev, "firmware not found\n"); - return; - } - -@@ -1302,7 +1452,10 @@ - goto err_firmware; - switch (header->version_major) { - case 1: -- sdma->script_number = SDMA_SCRIPT_ADDRS_ARRAY_SIZE_V1; -+ if (header->version_minor > 0) -+ sdma->script_number = SDMA_SCRIPT_ADDRS_ARRAY_SIZE_V2; -+ else -+ sdma->script_number = SDMA_SCRIPT_ADDRS_ARRAY_SIZE_V1; - break; - case 2: - sdma->script_number = SDMA_SCRIPT_ADDRS_ARRAY_SIZE_V2; -@@ -1337,7 +1490,7 @@ - release_firmware(fw); - } - --static int sdma_get_firmware(struct sdma_engine *sdma, -+static int __init sdma_get_firmware(struct sdma_engine *sdma, - const char *fw_name) - { - int ret; -@@ -1349,9 +1502,9 @@ - return ret; - } - --static int sdma_init(struct sdma_engine *sdma) -+static int __init sdma_init(struct sdma_engine *sdma) - { -- int i, ret; -+ int i, ret, ccbsize; - dma_addr_t ccb_phys; - - clk_enable(sdma->clk_ipg); -@@ -1360,14 +1513,17 @@ - /* Be sure SDMA has not started yet */ - writel_relaxed(0, sdma->regs + SDMA_H_C0PTR); - -- sdma->channel_control = dma_alloc_coherent(NULL, -- MAX_DMA_CHANNELS * sizeof (struct sdma_channel_control) + -- sizeof(struct sdma_context_data), -- &ccb_phys, GFP_KERNEL); -+ ccbsize = MAX_DMA_CHANNELS * sizeof (struct sdma_channel_control) -+ + sizeof(struct sdma_context_data); - -+ sdma->channel_control = gen_pool_dma_alloc(sdma->iram_pool, ccbsize, &ccb_phys); - if (!sdma->channel_control) { -- ret = -ENOMEM; -- goto err_dma_alloc; -+ sdma->channel_control = dma_alloc_coherent(NULL, ccbsize, -+ &ccb_phys, GFP_KERNEL); -+ if (!sdma->channel_control) { -+ ret = -ENOMEM; -+ goto err_dma_alloc; -+ } - } - - sdma->context = (void *)sdma->channel_control + -@@ -1419,14 +1575,12 @@ - - static bool sdma_filter_fn(struct dma_chan *chan, void *fn_param) - { -- struct sdma_channel *sdmac = to_sdma_chan(chan); - struct imx_dma_data *data = fn_param; - - if (!imx_dma_is_general_purpose(chan)) - return false; - -- sdmac->data = *data; -- chan->private = &sdmac->data; -+ chan->private = data; - - return true; - } -@@ -1444,11 +1598,12 @@ - data.dma_request = dma_spec->args[0]; - data.peripheral_type = dma_spec->args[1]; - data.priority = dma_spec->args[2]; -+ data.dma_request2 = 0; - - return dma_request_channel(mask, sdma_filter_fn, &data); - } - --static int sdma_probe(struct platform_device *pdev) -+static int __init sdma_probe(struct platform_device *pdev) - { - const struct of_device_id *of_id = - of_match_device(sdma_dt_ids, &pdev->dev); -@@ -1547,6 +1702,11 @@ - &sdma->dma_device.channels); - } - -+ if (np) -+ sdma->iram_pool = of_get_named_gen_pool(np, "iram", 0); -+ if (!sdma->iram_pool) -+ dev_warn(&pdev->dev, "no iram assigned, using external mem\n"); -+ - ret = sdma_init(sdma); - if (ret) - goto err_init; -@@ -1583,7 +1743,7 @@ - sdma->dma_device.device_free_chan_resources = sdma_free_chan_resources; - sdma->dma_device.device_tx_status = sdma_tx_status; - sdma->dma_device.device_prep_slave_sg = sdma_prep_slave_sg; -- sdma->dma_device.device_prep_dma_cyclic = sdma_prep_dma_cyclic; -+ sdma->dma_device.device_prep_dma_cyclic = (void*)sdma_prep_dma_cyclic; - sdma->dma_device.device_config = sdma_config; - sdma->dma_device.device_terminate_all = sdma_disable_channel; - sdma->dma_device.src_addr_widths = BIT(DMA_SLAVE_BUSWIDTH_4_BYTES); -@@ -1594,8 +1754,6 @@ - sdma->dma_device.dev->dma_parms = &sdma->dma_parms; - dma_set_max_seg_size(sdma->dma_device.dev, 65535); - -- platform_set_drvdata(pdev, sdma); -- - ret = dma_async_device_register(&sdma->dma_device); - if (ret) { - 
dev_err(&pdev->dev, "unable to register\n"); -@@ -1647,10 +1805,13 @@ - }, - .id_table = sdma_devtypes, - .remove = sdma_remove, -- .probe = sdma_probe, - }; - --module_platform_driver(sdma_driver); -+static int __init sdma_module_init(void) -+{ -+ return platform_driver_probe(&sdma_driver, sdma_probe); -+} -+module_init(sdma_module_init); - - MODULE_AUTHOR("Sascha Hauer, Pengutronix "); - MODULE_DESCRIPTION("i.MX SDMA driver"); -diff -Nur linux-4.1.3/drivers/gpu/drm/Kconfig linux-xbian-imx6/drivers/gpu/drm/Kconfig ---- linux-4.1.3/drivers/gpu/drm/Kconfig 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/drivers/gpu/drm/Kconfig 2015-07-27 23:13:04.353449682 +0200 -@@ -217,3 +217,5 @@ - source "drivers/gpu/drm/amd/amdkfd/Kconfig" - - source "drivers/gpu/drm/imx/Kconfig" -+ -+source "drivers/gpu/drm/vivante/Kconfig" -diff -Nur linux-4.1.3/drivers/gpu/drm/Makefile linux-xbian-imx6/drivers/gpu/drm/Makefile ---- linux-4.1.3/drivers/gpu/drm/Makefile 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/drivers/gpu/drm/Makefile 2015-07-27 23:13:04.353449682 +0200 -@@ -67,6 +67,7 @@ - obj-$(CONFIG_DRM_TEGRA) += tegra/ - obj-$(CONFIG_DRM_STI) += sti/ - obj-$(CONFIG_DRM_IMX) += imx/ -+obj-$(CONFIG_DRM_VIVANTE) += vivante/ - obj-y += i2c/ - obj-y += panel/ - obj-y += bridge/ -diff -Nur linux-4.1.3/drivers/gpu/drm/vivante/Kconfig linux-xbian-imx6/drivers/gpu/drm/vivante/Kconfig ---- linux-4.1.3/drivers/gpu/drm/vivante/Kconfig 1970-01-01 01:00:00.000000000 +0100 -+++ linux-xbian-imx6/drivers/gpu/drm/vivante/Kconfig 2015-07-27 23:13:04.744056042 +0200 -@@ -0,0 +1,6 @@ -+config DRM_VIVANTE -+ tristate "Vivante GCCore" -+ depends on DRM -+ help -+ Choose this option if you have a Vivante graphics card. -+ If M is selected, the module will be called vivante. -diff -Nur linux-4.1.3/drivers/gpu/drm/vivante/Makefile linux-xbian-imx6/drivers/gpu/drm/vivante/Makefile ---- linux-4.1.3/drivers/gpu/drm/vivante/Makefile 1970-01-01 01:00:00.000000000 +0100 -+++ linux-xbian-imx6/drivers/gpu/drm/vivante/Makefile 2015-07-27 23:13:04.744056042 +0200 -@@ -0,0 +1,29 @@ -+############################################################################## -+# -+# Copyright (C) 2005 - 2013 by Vivante Corp. -+# -+# This program is free software; you can redistribute it and/or modify -+# it under the terms of the GNU General Public License as published by -+# the Free Software Foundation; either version 2 of the license, or -+# (at your option) any later version. -+# -+# This program is distributed in the hope that it will be useful, -+# but WITHOUT ANY WARRANTY; without even the implied warranty of -+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the -+# GNU General Public License for more details. -+# -+# You should have received a copy of the GNU General Public License -+# along with this program; if not write to the Free Software -+# Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. -+# -+############################################################################## -+ -+ -+# -+# Makefile for the drm device driver. This driver provides support for the -+# Direct Rendering Infrastructure (DRI) in XFree86 4.1.0 and higher. 
-+ -+ccflags-y := -Iinclude/drm -+vivante-y := vivante_drv.o -+ -+obj-$(CONFIG_DRM_VIVANTE) += vivante.o -diff -Nur linux-4.1.3/drivers/gpu/drm/vivante/vivante_drv.c linux-xbian-imx6/drivers/gpu/drm/vivante/vivante_drv.c ---- linux-4.1.3/drivers/gpu/drm/vivante/vivante_drv.c 1970-01-01 01:00:00.000000000 +0100 -+++ linux-xbian-imx6/drivers/gpu/drm/vivante/vivante_drv.c 2015-07-27 23:13:04.744056042 +0200 -@@ -0,0 +1,112 @@ -+/**************************************************************************** -+* -+* Copyright (C) 2005 - 2013 by Vivante Corp. -+* -+* This program is free software; you can redistribute it and/or modify -+* it under the terms of the GNU General Public License as published by -+* the Free Software Foundation; either version 2 of the license, or -+* (at your option) any later version. -+* -+* This program is distributed in the hope that it will be useful, -+* but WITHOUT ANY WARRANTY; without even the implied warranty of -+* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the -+* GNU General Public License for more details. -+* -+* You should have received a copy of the GNU General Public License -+* along with this program; if not write to the Free Software -+* Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. -+* -+*****************************************************************************/ -+ -+ -+/* vivante_drv.c -- vivante driver -*- linux-c -*- -+ * -+ * -+ * Permission is hereby granted, free of charge, to any person obtaining a -+ * copy of this software and associated documentation files (the "Software"), -+ * to deal in the Software without restriction, including without limitation -+ * the rights to use, copy, modify, merge, publish, distribute, sublicense, -+ * and/or sell copies of the Software, and to permit persons to whom the -+ * Software is furnished to do so, subject to the following conditions: -+ * -+ * The above copyright notice and this permission notice (including the next -+ * paragraph) shall be included in all copies or substantial portions of the -+ * Software. -+ * -+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR -+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, -+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL -+ * PRECISION INSIGHT AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, DAMAGES OR -+ * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, -+ * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER -+ * DEALINGS IN THE SOFTWARE. -+ * -+ * Authors: -+ * Rickard E. 
(Rik) Faith -+ * Daryll Strauss -+ * Gareth Hughes -+ */ -+ -+#include -+#include -+ -+#include "drmP.h" -+#include "vivante_drv.h" -+ -+#include "drm_pciids.h" -+ -+static char platformdevicename[] = "Vivante GCCore"; -+static struct platform_device *pplatformdev; -+ -+static const struct file_operations viv_driver_fops = { -+ .owner = THIS_MODULE, -+ .open = drm_open, -+ .release = drm_release, -+ .unlocked_ioctl = drm_ioctl, -+ .mmap = drm_legacy_mmap, -+ .poll = drm_poll, -+ .llseek = noop_llseek, -+}; -+ -+static struct drm_driver driver = { -+// .driver_features = DRIVER_RENDER, -+ .fops = &viv_driver_fops, -+#if LINUX_VERSION_CODE >= KERNEL_VERSION(3, 18, 0) -+ .set_busid = drm_platform_set_busid, -+#endif -+ .name = DRIVER_NAME, -+ .desc = DRIVER_DESC, -+ .date = DRIVER_DATE, -+ .major = DRIVER_MAJOR, -+ .minor = DRIVER_MINOR, -+ .patchlevel = DRIVER_PATCHLEVEL, -+}; -+ -+static int __init vivante_init(void) -+{ -+ int retcode; -+ -+ pplatformdev = platform_device_register_simple(platformdevicename, -+ -1, NULL, 0); -+ if (pplatformdev == NULL) -+ printk(KERN_ERR"Platform device is null\n"); -+ -+ retcode = drm_platform_init(&driver, pplatformdev); -+ -+ return retcode; -+} -+ -+static void __exit vivante_exit(void) -+{ -+ if (pplatformdev) { -+ platform_device_unregister(pplatformdev); -+ pplatformdev = NULL; -+ } -+} -+ -+module_init(vivante_init); -+module_exit(vivante_exit); -+ -+MODULE_AUTHOR(DRIVER_AUTHOR); -+MODULE_DESCRIPTION(DRIVER_DESC); -+MODULE_LICENSE("GPL and additional rights"); -diff -Nur linux-4.1.3/drivers/gpu/drm/vivante/vivante_drv.h linux-xbian-imx6/drivers/gpu/drm/vivante/vivante_drv.h ---- linux-4.1.3/drivers/gpu/drm/vivante/vivante_drv.h 1970-01-01 01:00:00.000000000 +0100 -+++ linux-xbian-imx6/drivers/gpu/drm/vivante/vivante_drv.h 2015-07-27 23:13:04.744056042 +0200 -@@ -0,0 +1,69 @@ -+/**************************************************************************** -+* -+* Copyright (C) 2005 - 2013 by Vivante Corp. -+* -+* This program is free software; you can redistribute it and/or modify -+* it under the terms of the GNU General Public License as published by -+* the Free Software Foundation; either version 2 of the license, or -+* (at your option) any later version. -+* -+* This program is distributed in the hope that it will be useful, -+* but WITHOUT ANY WARRANTY; without even the implied warranty of -+* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the -+* GNU General Public License for more details. -+* -+* You should have received a copy of the GNU General Public License -+* along with this program; if not write to the Free Software -+* Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. 
-+* -+*****************************************************************************/ -+ -+ -+/* vivante_drv.h -- Vivante DRM template customization -*- linux-c -*- -+ * Created: Wed Feb 14 12:32:32 2012 by John Zhao -+ */ -+/* -+ * -+ * Permission is hereby granted, free of charge, to any person obtaining a -+ * copy of this software and associated documentation files (the "Software"), -+ * to deal in the Software without restriction, including without limitation -+ * the rights to use, copy, modify, merge, publish, distribute, sublicense, -+ * and/or sell copies of the Software, and to permit persons to whom the -+ * Software is furnished to do so, subject to the following conditions: -+ * -+ * The above copyright notice and this permission notice (including the next -+ * paragraph) shall be included in all copies or substantial portions of the -+ * Software. -+ * -+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR -+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, -+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL -+ * VA LINUX SYSTEMS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, DAMAGES OR -+ * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, -+ * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR -+ * OTHER DEALINGS IN THE SOFTWARE. -+ * -+ * Authors: -+ * Gareth Hughes -+ */ -+ -+#ifndef __VIVANTE_DRV_H__ -+#define __VIVANTE_DRV_H__ -+ -+/* General customization: -+ */ -+ -+#include -+#include -+ -+#define DRIVER_AUTHOR "Vivante Inc." -+ -+#define DRIVER_NAME "vivante" -+#define DRIVER_DESC "Vivante GCCore" -+#define DRIVER_DATE "20120216" -+ -+#define DRIVER_MAJOR 1 -+#define DRIVER_MINOR 0 -+#define DRIVER_PATCHLEVEL 0 -+ -+#endif -diff -Nur linux-4.1.3/drivers/Kconfig linux-xbian-imx6/drivers/Kconfig ---- linux-4.1.3/drivers/Kconfig 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/drivers/Kconfig 2015-07-27 23:13:03.699781896 +0200 -@@ -182,4 +182,6 @@ - - source "drivers/android/Kconfig" - -+source "drivers/mxc/Kconfig" -+ - endmenu -diff -Nur linux-4.1.3/drivers/Makefile linux-xbian-imx6/drivers/Makefile ---- linux-4.1.3/drivers/Makefile 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/drivers/Makefile 2015-07-27 23:13:03.699781896 +0200 -@@ -165,3 +165,4 @@ - obj-$(CONFIG_THUNDERBOLT) += thunderbolt/ - obj-$(CONFIG_CORESIGHT) += hwtracing/coresight/ - obj-$(CONFIG_ANDROID) += android/ -+obj-y += mxc/ -diff -Nur linux-4.1.3/drivers/mfd/Kconfig linux-xbian-imx6/drivers/mfd/Kconfig ---- linux-4.1.3/drivers/mfd/Kconfig 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/drivers/mfd/Kconfig 2015-07-27 23:13:06.023491162 +0200 -@@ -207,6 +207,13 @@ - Additional drivers must be enabled in order to use the specific - features of the device. - -+config MFD_MXC_HDMI -+ tristate "Freescale HDMI Core" -+ select MFD_CORE -+ help -+ This is the core driver for the Freescale i.MX6 on-chip HDMI. -+ This MFD driver connects with the video and audio drivers for HDMI. 
-+ - config MFD_DLN2 - tristate "Diolan DLN2 support" - select MFD_CORE -diff -Nur linux-4.1.3/drivers/mfd/Makefile linux-xbian-imx6/drivers/mfd/Makefile ---- linux-4.1.3/drivers/mfd/Makefile 2015-07-21 19:10:33.000000000 +0200 -+++ linux-xbian-imx6/drivers/mfd/Makefile 2015-07-27 23:13:06.023491162 +0200 -@@ -185,3 +185,4 @@ - intel-soc-pmic-objs := intel_soc_pmic_core.o intel_soc_pmic_crc.o - obj-$(CONFIG_INTEL_SOC_PMIC) += intel-soc-pmic.o - obj-$(CONFIG_MFD_MT6397) += mt6397-core.o -+obj-$(CONFIG_MFD_MXC_HDMI) += mxc-hdmi-core.o -diff -Nur linux-4.1.3/drivers/mfd/mxc-hdmi-core.c linux-xbian-imx6/drivers/mfd/mxc-hdmi-core.c ---- linux-4.1.3/drivers/mfd/mxc-hdmi-core.c 1970-01-01 01:00:00.000000000 +0100 -+++ linux-xbian-imx6/drivers/mfd/mxc-hdmi-core.c 2015-07-27 23:13:06.051391618 +0200 -@@ -0,0 +1,723 @@ -+/* -+ * Copyright (C) 2011-2014 Freescale Semiconductor, Inc. -+ * -+ * This program is free software; you can redistribute it and/or modify -+ * it under the terms of the GNU General Public License as published by -+ * the Free Software Foundation; either version 2 of the License, or -+ * (at your option) any later version. -+ * -+ * This program is distributed in the hope that it will be useful, -+ * but WITHOUT ANY WARRANTY; without even the implied warranty of -+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the -+ * GNU General Public License for more details. -+ * -+ * You should have received a copy of the GNU General Public License -+ * along with this program; if not, write to the Free Software -+ * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA -+ * -+ */ -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+#include -+ -+#include -+#include -+#include -+ -+#include